Files
r2egym-nl2bash-bugsseq/trainer_state.json
ModelHub XC 2ccf1f0e56 初始化项目,由ModelHub XC社区提供模型
Model: laion/r2egym-nl2bash-bugsseq
Source: Original Platform
2026-05-05 19:55:55 +08:00

18968 lines
527 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 6.999592999592999,
"eval_steps": 500,
"global_step": 8602,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.00407000407000407,
"grad_norm": 16.688738856727717,
"learning_rate": 1.8583042973286877e-07,
"loss": 0.6602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.309528112411499,
"step": 5,
"valid_targets_mean": 7389.0,
"valid_targets_min": 5627
},
{
"epoch": 0.00814000814000814,
"grad_norm": 16.284518291358502,
"learning_rate": 4.181184668989548e-07,
"loss": 0.7004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23656058311462402,
"step": 10,
"valid_targets_mean": 1294.8,
"valid_targets_min": 422
},
{
"epoch": 0.01221001221001221,
"grad_norm": 14.7645423037296,
"learning_rate": 6.504065040650407e-07,
"loss": 0.6791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3238072991371155,
"step": 15,
"valid_targets_mean": 8539.9,
"valid_targets_min": 6761
},
{
"epoch": 0.01628001628001628,
"grad_norm": 13.258019811923578,
"learning_rate": 8.826945412311266e-07,
"loss": 0.6127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28863972425460815,
"step": 20,
"valid_targets_mean": 7579.0,
"valid_targets_min": 6174
},
{
"epoch": 0.02035002035002035,
"grad_norm": 10.994253756620328,
"learning_rate": 1.1149825783972125e-06,
"loss": 0.6115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29230475425720215,
"step": 25,
"valid_targets_mean": 7328.2,
"valid_targets_min": 4839
},
{
"epoch": 0.02442002442002442,
"grad_norm": 7.768784524679733,
"learning_rate": 1.3472706155632985e-06,
"loss": 0.604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3191682696342468,
"step": 30,
"valid_targets_mean": 6838.2,
"valid_targets_min": 5034
},
{
"epoch": 0.02849002849002849,
"grad_norm": 5.751080564869644,
"learning_rate": 1.5795586527293845e-06,
"loss": 0.5845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29048168659210205,
"step": 35,
"valid_targets_mean": 7248.2,
"valid_targets_min": 5567
},
{
"epoch": 0.03256003256003256,
"grad_norm": 5.28995649654892,
"learning_rate": 1.8118466898954705e-06,
"loss": 0.5404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2563433349132538,
"step": 40,
"valid_targets_mean": 6234.0,
"valid_targets_min": 5603
},
{
"epoch": 0.03663003663003663,
"grad_norm": 6.617277965973996,
"learning_rate": 2.0441347270615568e-06,
"loss": 0.5329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12342505156993866,
"step": 45,
"valid_targets_mean": 602.0,
"valid_targets_min": 152
},
{
"epoch": 0.0407000407000407,
"grad_norm": 3.0152890224296596,
"learning_rate": 2.2764227642276426e-06,
"loss": 0.4588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22148989140987396,
"step": 50,
"valid_targets_mean": 7299.9,
"valid_targets_min": 6158
},
{
"epoch": 0.04477004477004477,
"grad_norm": 2.061368844016502,
"learning_rate": 2.5087108013937284e-06,
"loss": 0.4436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2079901248216629,
"step": 55,
"valid_targets_mean": 6140.0,
"valid_targets_min": 4648
},
{
"epoch": 0.04884004884004884,
"grad_norm": 1.356693424104223,
"learning_rate": 2.7409988385598146e-06,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21061325073242188,
"step": 60,
"valid_targets_mean": 6603.0,
"valid_targets_min": 4882
},
{
"epoch": 0.05291005291005291,
"grad_norm": 1.0151992206933238,
"learning_rate": 2.9732868757259004e-06,
"loss": 0.4018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20564204454421997,
"step": 65,
"valid_targets_mean": 8015.0,
"valid_targets_min": 6344
},
{
"epoch": 0.05698005698005698,
"grad_norm": 0.8990999330833235,
"learning_rate": 3.205574912891986e-06,
"loss": 0.3898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18953731656074524,
"step": 70,
"valid_targets_mean": 6305.2,
"valid_targets_min": 4622
},
{
"epoch": 0.06105006105006105,
"grad_norm": 0.7436312346393562,
"learning_rate": 3.4378629500580724e-06,
"loss": 0.392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20007365942001343,
"step": 75,
"valid_targets_mean": 7890.8,
"valid_targets_min": 5485
},
{
"epoch": 0.06512006512006512,
"grad_norm": 0.6714920662823174,
"learning_rate": 3.670150987224158e-06,
"loss": 0.387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.175824835896492,
"step": 80,
"valid_targets_mean": 7016.6,
"valid_targets_min": 4960
},
{
"epoch": 0.06919006919006919,
"grad_norm": 0.6272831883685218,
"learning_rate": 3.902439024390244e-06,
"loss": 0.373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17543438076972961,
"step": 85,
"valid_targets_mean": 6527.1,
"valid_targets_min": 5399
},
{
"epoch": 0.07326007326007326,
"grad_norm": 0.7089605501278246,
"learning_rate": 4.13472706155633e-06,
"loss": 0.3711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18534767627716064,
"step": 90,
"valid_targets_mean": 4995.0,
"valid_targets_min": 618
},
{
"epoch": 0.07733007733007732,
"grad_norm": 0.5692706983764877,
"learning_rate": 4.367015098722416e-06,
"loss": 0.3807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1900652050971985,
"step": 95,
"valid_targets_mean": 7219.4,
"valid_targets_min": 5764
},
{
"epoch": 0.0814000814000814,
"grad_norm": 0.5526365515310625,
"learning_rate": 4.599303135888502e-06,
"loss": 0.364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18986254930496216,
"step": 100,
"valid_targets_mean": 7998.5,
"valid_targets_min": 5902
},
{
"epoch": 0.08547008547008547,
"grad_norm": 0.5591512425354309,
"learning_rate": 4.831591173054588e-06,
"loss": 0.3303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1477121263742447,
"step": 105,
"valid_targets_mean": 7377.4,
"valid_targets_min": 5015
},
{
"epoch": 0.08954008954008955,
"grad_norm": 0.47170286143316387,
"learning_rate": 5.063879210220674e-06,
"loss": 0.3322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14665284752845764,
"step": 110,
"valid_targets_mean": 6794.0,
"valid_targets_min": 5283
},
{
"epoch": 0.0936100936100936,
"grad_norm": 0.546971917140672,
"learning_rate": 5.29616724738676e-06,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1953507661819458,
"step": 115,
"valid_targets_mean": 6656.4,
"valid_targets_min": 4364
},
{
"epoch": 0.09768009768009768,
"grad_norm": 0.4730703657980557,
"learning_rate": 5.528455284552846e-06,
"loss": 0.3323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1581360101699829,
"step": 120,
"valid_targets_mean": 7178.4,
"valid_targets_min": 4448
},
{
"epoch": 0.10175010175010175,
"grad_norm": 0.5438344423212753,
"learning_rate": 5.7607433217189324e-06,
"loss": 0.3264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18480417132377625,
"step": 125,
"valid_targets_mean": 7619.8,
"valid_targets_min": 5737
},
{
"epoch": 0.10582010582010581,
"grad_norm": 0.42704045318550676,
"learning_rate": 5.993031358885018e-06,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13994517922401428,
"step": 130,
"valid_targets_mean": 8754.4,
"valid_targets_min": 5752
},
{
"epoch": 0.10989010989010989,
"grad_norm": 0.5266020359474044,
"learning_rate": 6.225319396051104e-06,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15675979852676392,
"step": 135,
"valid_targets_mean": 6341.0,
"valid_targets_min": 4543
},
{
"epoch": 0.11396011396011396,
"grad_norm": 0.5048534740315108,
"learning_rate": 6.45760743321719e-06,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15559503436088562,
"step": 140,
"valid_targets_mean": 7181.9,
"valid_targets_min": 4563
},
{
"epoch": 0.11803011803011804,
"grad_norm": 1.134587905553992,
"learning_rate": 6.6898954703832765e-06,
"loss": 0.3357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12442926317453384,
"step": 145,
"valid_targets_mean": 1104.4,
"valid_targets_min": 161
},
{
"epoch": 0.1221001221001221,
"grad_norm": 0.4270206279409013,
"learning_rate": 6.922183507549362e-06,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13907991349697113,
"step": 150,
"valid_targets_mean": 7018.2,
"valid_targets_min": 5424
},
{
"epoch": 0.12617012617012616,
"grad_norm": 0.4635086442233948,
"learning_rate": 7.154471544715448e-06,
"loss": 0.3187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1630023717880249,
"step": 155,
"valid_targets_mean": 7738.4,
"valid_targets_min": 5329
},
{
"epoch": 0.13024013024013023,
"grad_norm": 0.5079812404242928,
"learning_rate": 7.386759581881534e-06,
"loss": 0.325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1584567427635193,
"step": 160,
"valid_targets_mean": 6426.6,
"valid_targets_min": 5560
},
{
"epoch": 0.1343101343101343,
"grad_norm": 0.5050284094328902,
"learning_rate": 7.61904761904762e-06,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16165009140968323,
"step": 165,
"valid_targets_mean": 6169.9,
"valid_targets_min": 3446
},
{
"epoch": 0.13838013838013838,
"grad_norm": 0.498091820817201,
"learning_rate": 7.851335656213705e-06,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15471090376377106,
"step": 170,
"valid_targets_mean": 7204.6,
"valid_targets_min": 5381
},
{
"epoch": 0.14245014245014245,
"grad_norm": 0.48505113847764975,
"learning_rate": 8.083623693379791e-06,
"loss": 0.3053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1558820754289627,
"step": 175,
"valid_targets_mean": 7600.4,
"valid_targets_min": 5241
},
{
"epoch": 0.14652014652014653,
"grad_norm": 0.4895882936126897,
"learning_rate": 8.315911730545877e-06,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16261817514896393,
"step": 180,
"valid_targets_mean": 7098.5,
"valid_targets_min": 5607
},
{
"epoch": 0.1505901505901506,
"grad_norm": 0.49703616694051983,
"learning_rate": 8.548199767711964e-06,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15736651420593262,
"step": 185,
"valid_targets_mean": 6955.1,
"valid_targets_min": 5530
},
{
"epoch": 0.15466015466015465,
"grad_norm": 0.47329084552349354,
"learning_rate": 8.78048780487805e-06,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15062673389911652,
"step": 190,
"valid_targets_mean": 6748.1,
"valid_targets_min": 5364
},
{
"epoch": 0.15873015873015872,
"grad_norm": 0.5304350179179551,
"learning_rate": 9.012775842044136e-06,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14595365524291992,
"step": 195,
"valid_targets_mean": 6273.9,
"valid_targets_min": 5438
},
{
"epoch": 0.1628001628001628,
"grad_norm": 0.4804611842699093,
"learning_rate": 9.24506387921022e-06,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14614039659500122,
"step": 200,
"valid_targets_mean": 6419.5,
"valid_targets_min": 4879
},
{
"epoch": 0.16687016687016687,
"grad_norm": 1.0372553917536562,
"learning_rate": 9.477351916376307e-06,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1451706886291504,
"step": 205,
"valid_targets_mean": 6483.4,
"valid_targets_min": 4309
},
{
"epoch": 0.17094017094017094,
"grad_norm": 0.5083493341784381,
"learning_rate": 9.709639953542393e-06,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16406603157520294,
"step": 210,
"valid_targets_mean": 6825.0,
"valid_targets_min": 5205
},
{
"epoch": 0.17501017501017502,
"grad_norm": 0.46301643664731623,
"learning_rate": 9.94192799070848e-06,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13244540989398956,
"step": 215,
"valid_targets_mean": 6729.4,
"valid_targets_min": 5200
},
{
"epoch": 0.1790801790801791,
"grad_norm": 0.49215202614656767,
"learning_rate": 1.0174216027874565e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13969576358795166,
"step": 220,
"valid_targets_mean": 6094.0,
"valid_targets_min": 5302
},
{
"epoch": 0.18315018315018314,
"grad_norm": 0.4871918972499842,
"learning_rate": 1.0406504065040652e-05,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14923205971717834,
"step": 225,
"valid_targets_mean": 7140.0,
"valid_targets_min": 5270
},
{
"epoch": 0.1872201872201872,
"grad_norm": 0.4471280600208976,
"learning_rate": 1.0638792102206736e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.131822407245636,
"step": 230,
"valid_targets_mean": 7425.0,
"valid_targets_min": 5281
},
{
"epoch": 0.19129019129019129,
"grad_norm": 1.2605795171969003,
"learning_rate": 1.0871080139372822e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1726950705051422,
"step": 235,
"valid_targets_mean": 7063.4,
"valid_targets_min": 5386
},
{
"epoch": 0.19536019536019536,
"grad_norm": 0.4932596835670058,
"learning_rate": 1.1103368176538909e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14937910437583923,
"step": 240,
"valid_targets_mean": 6827.0,
"valid_targets_min": 4547
},
{
"epoch": 0.19943019943019943,
"grad_norm": 0.9167985105196412,
"learning_rate": 1.1335656213704995e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09083765000104904,
"step": 245,
"valid_targets_mean": 2047.0,
"valid_targets_min": 165
},
{
"epoch": 0.2035002035002035,
"grad_norm": 0.4621000775660505,
"learning_rate": 1.1567944250871081e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1386224627494812,
"step": 250,
"valid_targets_mean": 6754.1,
"valid_targets_min": 5196
},
{
"epoch": 0.20757020757020758,
"grad_norm": 0.5251600558673276,
"learning_rate": 1.1800232288037167e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13912081718444824,
"step": 255,
"valid_targets_mean": 5985.6,
"valid_targets_min": 5028
},
{
"epoch": 0.21164021164021163,
"grad_norm": 0.5423901600668142,
"learning_rate": 1.2032520325203254e-05,
"loss": 0.2795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12727007269859314,
"step": 260,
"valid_targets_mean": 5963.9,
"valid_targets_min": 5237
},
{
"epoch": 0.2157102157102157,
"grad_norm": 0.5203028801997557,
"learning_rate": 1.2264808362369338e-05,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1433340162038803,
"step": 265,
"valid_targets_mean": 6319.0,
"valid_targets_min": 5412
},
{
"epoch": 0.21978021978021978,
"grad_norm": 0.5281674096137197,
"learning_rate": 1.2497096399535424e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11158867180347443,
"step": 270,
"valid_targets_mean": 7125.8,
"valid_targets_min": 5080
},
{
"epoch": 0.22385022385022385,
"grad_norm": 0.6582757970482628,
"learning_rate": 1.272938443670151e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13590899109840393,
"step": 275,
"valid_targets_mean": 6123.5,
"valid_targets_min": 4521
},
{
"epoch": 0.22792022792022792,
"grad_norm": 2.7614047900823837,
"learning_rate": 1.2961672473867597e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24310331046581268,
"step": 280,
"valid_targets_mean": 1886.0,
"valid_targets_min": 1111
},
{
"epoch": 0.231990231990232,
"grad_norm": 1.5491066018218123,
"learning_rate": 1.3193960511033683e-05,
"loss": 0.4133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20701418817043304,
"step": 285,
"valid_targets_mean": 1497.6,
"valid_targets_min": 893
},
{
"epoch": 0.23606023606023607,
"grad_norm": 1.1536064750715551,
"learning_rate": 1.3426248548199769e-05,
"loss": 0.3633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1264546811580658,
"step": 290,
"valid_targets_mean": 1356.0,
"valid_targets_min": 914
},
{
"epoch": 0.24013024013024012,
"grad_norm": 1.2647474847869884,
"learning_rate": 1.3658536585365855e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1455959528684616,
"step": 295,
"valid_targets_mean": 1324.5,
"valid_targets_min": 680
},
{
"epoch": 0.2442002442002442,
"grad_norm": 0.997749848075399,
"learning_rate": 1.389082462253194e-05,
"loss": 0.3337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15397366881370544,
"step": 300,
"valid_targets_mean": 1931.8,
"valid_targets_min": 876
},
{
"epoch": 0.24827024827024827,
"grad_norm": 1.0630278095878878,
"learning_rate": 1.4123112659698026e-05,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1414937824010849,
"step": 305,
"valid_targets_mean": 1292.2,
"valid_targets_min": 734
},
{
"epoch": 0.2523402523402523,
"grad_norm": 0.9931657056115516,
"learning_rate": 1.4355400696864112e-05,
"loss": 0.3245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1270873248577118,
"step": 310,
"valid_targets_mean": 1469.6,
"valid_targets_min": 655
},
{
"epoch": 0.2564102564102564,
"grad_norm": 1.1018628472649998,
"learning_rate": 1.4587688734030199e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15461672842502594,
"step": 315,
"valid_targets_mean": 1548.4,
"valid_targets_min": 737
},
{
"epoch": 0.26048026048026046,
"grad_norm": 1.0914493892414534,
"learning_rate": 1.4819976771196285e-05,
"loss": 0.3116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13322024047374725,
"step": 320,
"valid_targets_mean": 1316.5,
"valid_targets_min": 759
},
{
"epoch": 0.26455026455026454,
"grad_norm": 1.1154554492176114,
"learning_rate": 1.5052264808362371e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11124762892723083,
"step": 325,
"valid_targets_mean": 1249.6,
"valid_targets_min": 753
},
{
"epoch": 0.2686202686202686,
"grad_norm": 1.056667017250088,
"learning_rate": 1.528455284552846e-05,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18556742370128632,
"step": 330,
"valid_targets_mean": 1833.0,
"valid_targets_min": 927
},
{
"epoch": 0.2726902726902727,
"grad_norm": 1.004899439380304,
"learning_rate": 1.5516840882694542e-05,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14251361787319183,
"step": 335,
"valid_targets_mean": 1338.4,
"valid_targets_min": 679
},
{
"epoch": 0.27676027676027676,
"grad_norm": 1.1790950500190507,
"learning_rate": 1.5749128919860628e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12715528905391693,
"step": 340,
"valid_targets_mean": 1244.6,
"valid_targets_min": 771
},
{
"epoch": 0.28083028083028083,
"grad_norm": 1.3870604631519712,
"learning_rate": 1.5981416957026714e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12742307782173157,
"step": 345,
"valid_targets_mean": 1732.5,
"valid_targets_min": 986
},
{
"epoch": 0.2849002849002849,
"grad_norm": 1.0033141410182251,
"learning_rate": 1.62137049941928e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12324304133653641,
"step": 350,
"valid_targets_mean": 1389.9,
"valid_targets_min": 1103
},
{
"epoch": 0.288970288970289,
"grad_norm": 1.0333697812051308,
"learning_rate": 1.6445993031358887e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15279968082904816,
"step": 355,
"valid_targets_mean": 1593.2,
"valid_targets_min": 675
},
{
"epoch": 0.29304029304029305,
"grad_norm": 0.915729241739608,
"learning_rate": 1.6678281068524973e-05,
"loss": 0.2777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16900552809238434,
"step": 360,
"valid_targets_mean": 1926.6,
"valid_targets_min": 974
},
{
"epoch": 0.29711029711029713,
"grad_norm": 1.0882207091700582,
"learning_rate": 1.691056910569106e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1652759164571762,
"step": 365,
"valid_targets_mean": 1953.1,
"valid_targets_min": 869
},
{
"epoch": 0.3011803011803012,
"grad_norm": 0.9858438574283391,
"learning_rate": 1.7142857142857142e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12480325996875763,
"step": 370,
"valid_targets_mean": 1327.2,
"valid_targets_min": 1023
},
{
"epoch": 0.3052503052503053,
"grad_norm": 0.9782058898631699,
"learning_rate": 1.7375145180023228e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14944294095039368,
"step": 375,
"valid_targets_mean": 1717.9,
"valid_targets_min": 709
},
{
"epoch": 0.3093203093203093,
"grad_norm": 1.2128421132256473,
"learning_rate": 1.7607433217189314e-05,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11604733765125275,
"step": 380,
"valid_targets_mean": 1139.9,
"valid_targets_min": 658
},
{
"epoch": 0.31339031339031337,
"grad_norm": 1.2503504626315993,
"learning_rate": 1.78397212543554e-05,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13267236948013306,
"step": 385,
"valid_targets_mean": 1444.8,
"valid_targets_min": 662
},
{
"epoch": 0.31746031746031744,
"grad_norm": 1.0828865674968162,
"learning_rate": 1.807200929152149e-05,
"loss": 0.2823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09767653793096542,
"step": 390,
"valid_targets_mean": 1242.2,
"valid_targets_min": 859
},
{
"epoch": 0.3215303215303215,
"grad_norm": 1.0500436494857386,
"learning_rate": 1.8304297328687576e-05,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15620818734169006,
"step": 395,
"valid_targets_mean": 1569.2,
"valid_targets_min": 950
},
{
"epoch": 0.3256003256003256,
"grad_norm": 1.2368316222797435,
"learning_rate": 1.8536585365853663e-05,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12553861737251282,
"step": 400,
"valid_targets_mean": 1539.8,
"valid_targets_min": 686
},
{
"epoch": 0.32967032967032966,
"grad_norm": 0.970316022027174,
"learning_rate": 1.8768873403019745e-05,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14505316317081451,
"step": 405,
"valid_targets_mean": 1610.6,
"valid_targets_min": 702
},
{
"epoch": 0.33374033374033374,
"grad_norm": 1.028981175641749,
"learning_rate": 1.900116144018583e-05,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09692301601171494,
"step": 410,
"valid_targets_mean": 1190.4,
"valid_targets_min": 779
},
{
"epoch": 0.3378103378103378,
"grad_norm": 1.079548761208398,
"learning_rate": 1.9233449477351918e-05,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1386578381061554,
"step": 415,
"valid_targets_mean": 1467.1,
"valid_targets_min": 822
},
{
"epoch": 0.3418803418803419,
"grad_norm": 1.0316182713272737,
"learning_rate": 1.9465737514518004e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10993292927742004,
"step": 420,
"valid_targets_mean": 1350.5,
"valid_targets_min": 868
},
{
"epoch": 0.34595034595034596,
"grad_norm": 1.1022256452208465,
"learning_rate": 1.969802555168409e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10702995955944061,
"step": 425,
"valid_targets_mean": 1283.5,
"valid_targets_min": 781
},
{
"epoch": 0.35002035002035004,
"grad_norm": 0.9493395584058351,
"learning_rate": 1.9930313588850176e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10873595625162125,
"step": 430,
"valid_targets_mean": 1303.2,
"valid_targets_min": 793
},
{
"epoch": 0.3540903540903541,
"grad_norm": 1.0733764593758766,
"learning_rate": 2.016260162601626e-05,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11143694072961807,
"step": 435,
"valid_targets_mean": 1309.1,
"valid_targets_min": 806
},
{
"epoch": 0.3581603581603582,
"grad_norm": 0.9098321906535183,
"learning_rate": 2.039488966318235e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10678255558013916,
"step": 440,
"valid_targets_mean": 1397.6,
"valid_targets_min": 803
},
{
"epoch": 0.36223036223036226,
"grad_norm": 0.9876007650935522,
"learning_rate": 2.0627177700348432e-05,
"loss": 0.2537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09560855478048325,
"step": 445,
"valid_targets_mean": 1187.8,
"valid_targets_min": 660
},
{
"epoch": 0.3663003663003663,
"grad_norm": 0.9221536800328648,
"learning_rate": 2.085946573751452e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10400258004665375,
"step": 450,
"valid_targets_mean": 1547.0,
"valid_targets_min": 853
},
{
"epoch": 0.37037037037037035,
"grad_norm": 1.1802888394338766,
"learning_rate": 2.1091753774680604e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13287541270256042,
"step": 455,
"valid_targets_mean": 1704.2,
"valid_targets_min": 719
},
{
"epoch": 0.3744403744403744,
"grad_norm": 0.9714075439297265,
"learning_rate": 2.132404181184669e-05,
"loss": 0.258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09262743592262268,
"step": 460,
"valid_targets_mean": 1255.0,
"valid_targets_min": 765
},
{
"epoch": 0.3785103785103785,
"grad_norm": 0.9864351204877326,
"learning_rate": 2.1556329849012777e-05,
"loss": 0.2523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12507298588752747,
"step": 465,
"valid_targets_mean": 1550.8,
"valid_targets_min": 875
},
{
"epoch": 0.38258038258038257,
"grad_norm": 1.0261001318904166,
"learning_rate": 2.1788617886178863e-05,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12351306527853012,
"step": 470,
"valid_targets_mean": 1362.0,
"valid_targets_min": 739
},
{
"epoch": 0.38665038665038665,
"grad_norm": 0.9746834269517334,
"learning_rate": 2.202090592334495e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14458400011062622,
"step": 475,
"valid_targets_mean": 1666.8,
"valid_targets_min": 760
},
{
"epoch": 0.3907203907203907,
"grad_norm": 1.0332993949409497,
"learning_rate": 2.2253193960511035e-05,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10632194578647614,
"step": 480,
"valid_targets_mean": 1319.6,
"valid_targets_min": 1046
},
{
"epoch": 0.3947903947903948,
"grad_norm": 0.9844297761113842,
"learning_rate": 2.2485481997677125e-05,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14072856307029724,
"step": 485,
"valid_targets_mean": 1727.9,
"valid_targets_min": 851
},
{
"epoch": 0.39886039886039887,
"grad_norm": 0.9685951678785188,
"learning_rate": 2.2717770034843208e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13506445288658142,
"step": 490,
"valid_targets_mean": 1643.2,
"valid_targets_min": 907
},
{
"epoch": 0.40293040293040294,
"grad_norm": 1.0189730102784529,
"learning_rate": 2.295005807200929e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11292707920074463,
"step": 495,
"valid_targets_mean": 1478.5,
"valid_targets_min": 764
},
{
"epoch": 0.407000407000407,
"grad_norm": 0.8788626334372063,
"learning_rate": 2.318234610917538e-05,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11425843089818954,
"step": 500,
"valid_targets_mean": 1522.6,
"valid_targets_min": 822
},
{
"epoch": 0.4110704110704111,
"grad_norm": 0.966805238471609,
"learning_rate": 2.3414634146341463e-05,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12144134938716888,
"step": 505,
"valid_targets_mean": 1589.0,
"valid_targets_min": 982
},
{
"epoch": 0.41514041514041516,
"grad_norm": 0.9177681985342081,
"learning_rate": 2.3646922183507553e-05,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12525641918182373,
"step": 510,
"valid_targets_mean": 1574.8,
"valid_targets_min": 816
},
{
"epoch": 0.4192104192104192,
"grad_norm": 1.0766725696353001,
"learning_rate": 2.3879210220673635e-05,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12393151223659515,
"step": 515,
"valid_targets_mean": 1422.0,
"valid_targets_min": 721
},
{
"epoch": 0.42328042328042326,
"grad_norm": 1.2191089483428443,
"learning_rate": 2.4111498257839725e-05,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09133152663707733,
"step": 520,
"valid_targets_mean": 1150.6,
"valid_targets_min": 741
},
{
"epoch": 0.42735042735042733,
"grad_norm": 0.9898911682614888,
"learning_rate": 2.4343786295005808e-05,
"loss": 0.2475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13438482582569122,
"step": 525,
"valid_targets_mean": 1684.2,
"valid_targets_min": 734
},
{
"epoch": 0.4314204314204314,
"grad_norm": 1.260093754517711,
"learning_rate": 2.4576074332171894e-05,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14740093052387238,
"step": 530,
"valid_targets_mean": 1937.1,
"valid_targets_min": 744
},
{
"epoch": 0.4354904354904355,
"grad_norm": 0.9354629606274133,
"learning_rate": 2.480836236933798e-05,
"loss": 0.2472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13996005058288574,
"step": 535,
"valid_targets_mean": 1842.2,
"valid_targets_min": 620
},
{
"epoch": 0.43956043956043955,
"grad_norm": 0.9747857839014156,
"learning_rate": 2.5040650406504066e-05,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14165043830871582,
"step": 540,
"valid_targets_mean": 1637.6,
"valid_targets_min": 785
},
{
"epoch": 0.4436304436304436,
"grad_norm": 0.9131689808991684,
"learning_rate": 2.5272938443670153e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12118691951036453,
"step": 545,
"valid_targets_mean": 1969.9,
"valid_targets_min": 740
},
{
"epoch": 0.4477004477004477,
"grad_norm": 1.119476251101989,
"learning_rate": 2.550522648083624e-05,
"loss": 0.2414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11075526475906372,
"step": 550,
"valid_targets_mean": 1432.1,
"valid_targets_min": 711
},
{
"epoch": 0.4517704517704518,
"grad_norm": 0.9872821443353325,
"learning_rate": 2.5737514518002325e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1334969699382782,
"step": 555,
"valid_targets_mean": 1695.6,
"valid_targets_min": 1122
},
{
"epoch": 0.45584045584045585,
"grad_norm": 1.1068786822143657,
"learning_rate": 2.596980255516841e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12975133955478668,
"step": 560,
"valid_targets_mean": 1524.5,
"valid_targets_min": 722
},
{
"epoch": 0.4599104599104599,
"grad_norm": 1.006903711549231,
"learning_rate": 2.6202090592334494e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10383662581443787,
"step": 565,
"valid_targets_mean": 1289.2,
"valid_targets_min": 661
},
{
"epoch": 0.463980463980464,
"grad_norm": 1.0929411309492179,
"learning_rate": 2.6434378629500584e-05,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11088858544826508,
"step": 570,
"valid_targets_mean": 1519.5,
"valid_targets_min": 1011
},
{
"epoch": 0.46805046805046807,
"grad_norm": 1.038541955016419,
"learning_rate": 2.6666666666666667e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12774452567100525,
"step": 575,
"valid_targets_mean": 1731.4,
"valid_targets_min": 1277
},
{
"epoch": 0.47212047212047215,
"grad_norm": 1.012572853810221,
"learning_rate": 2.6898954703832756e-05,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12323933839797974,
"step": 580,
"valid_targets_mean": 1486.1,
"valid_targets_min": 807
},
{
"epoch": 0.47619047619047616,
"grad_norm": 0.9487437622651357,
"learning_rate": 2.713124274099884e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13745994865894318,
"step": 585,
"valid_targets_mean": 1549.9,
"valid_targets_min": 679
},
{
"epoch": 0.48026048026048024,
"grad_norm": 0.9664417051166028,
"learning_rate": 2.736353077816493e-05,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11426427215337753,
"step": 590,
"valid_targets_mean": 1656.0,
"valid_targets_min": 1294
},
{
"epoch": 0.4843304843304843,
"grad_norm": 0.9917889070000425,
"learning_rate": 2.759581881533101e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.108737051486969,
"step": 595,
"valid_targets_mean": 1368.8,
"valid_targets_min": 790
},
{
"epoch": 0.4884004884004884,
"grad_norm": 0.9927611626798195,
"learning_rate": 2.7828106852497098e-05,
"loss": 0.2358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1328611820936203,
"step": 600,
"valid_targets_mean": 1765.8,
"valid_targets_min": 592
},
{
"epoch": 0.49247049247049246,
"grad_norm": 0.9537846739982789,
"learning_rate": 2.8060394889663184e-05,
"loss": 0.2408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12659400701522827,
"step": 605,
"valid_targets_mean": 1586.8,
"valid_targets_min": 662
},
{
"epoch": 0.49654049654049653,
"grad_norm": 1.0425594316679838,
"learning_rate": 2.829268292682927e-05,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11810390651226044,
"step": 610,
"valid_targets_mean": 1336.9,
"valid_targets_min": 622
},
{
"epoch": 0.5006105006105006,
"grad_norm": 0.9994638757290513,
"learning_rate": 2.8524970963995356e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07577566802501678,
"step": 615,
"valid_targets_mean": 1097.1,
"valid_targets_min": 625
},
{
"epoch": 0.5046805046805046,
"grad_norm": 0.9987546354296077,
"learning_rate": 2.8757259001161443e-05,
"loss": 0.2543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.095686174929142,
"step": 620,
"valid_targets_mean": 1484.9,
"valid_targets_min": 888
},
{
"epoch": 0.5087505087505088,
"grad_norm": 0.9799026275534664,
"learning_rate": 2.898954703832753e-05,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12912192940711975,
"step": 625,
"valid_targets_mean": 1757.0,
"valid_targets_min": 635
},
{
"epoch": 0.5128205128205128,
"grad_norm": 1.1131113884891992,
"learning_rate": 2.9221835075493615e-05,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1408751755952835,
"step": 630,
"valid_targets_mean": 1476.1,
"valid_targets_min": 522
},
{
"epoch": 0.5168905168905169,
"grad_norm": 1.380784458630799,
"learning_rate": 2.9454123112659698e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10641973465681076,
"step": 635,
"valid_targets_mean": 1230.9,
"valid_targets_min": 697
},
{
"epoch": 0.5209605209605209,
"grad_norm": 0.9088580356736188,
"learning_rate": 2.9686411149825787e-05,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12748828530311584,
"step": 640,
"valid_targets_mean": 1671.0,
"valid_targets_min": 1010
},
{
"epoch": 0.525030525030525,
"grad_norm": 1.164121895920127,
"learning_rate": 2.991869918699187e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11815395206212997,
"step": 645,
"valid_targets_mean": 1411.0,
"valid_targets_min": 769
},
{
"epoch": 0.5291005291005291,
"grad_norm": 0.8907723008997975,
"learning_rate": 3.015098722415796e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10028189420700073,
"step": 650,
"valid_targets_mean": 1298.6,
"valid_targets_min": 745
},
{
"epoch": 0.5331705331705332,
"grad_norm": 1.0360817268903895,
"learning_rate": 3.0383275261324043e-05,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10057306289672852,
"step": 655,
"valid_targets_mean": 1118.9,
"valid_targets_min": 680
},
{
"epoch": 0.5372405372405372,
"grad_norm": 1.0170055972555234,
"learning_rate": 3.061556329849013e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1395065188407898,
"step": 660,
"valid_targets_mean": 1905.9,
"valid_targets_min": 1347
},
{
"epoch": 0.5413105413105413,
"grad_norm": 0.9835868888525366,
"learning_rate": 3.084785133565622e-05,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1703340709209442,
"step": 665,
"valid_targets_mean": 1636.0,
"valid_targets_min": 851
},
{
"epoch": 0.5453805453805454,
"grad_norm": 1.140427074478225,
"learning_rate": 3.10801393728223e-05,
"loss": 0.2303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10298797488212585,
"step": 670,
"valid_targets_mean": 1457.2,
"valid_targets_min": 903
},
{
"epoch": 0.5494505494505495,
"grad_norm": 0.9191202259828434,
"learning_rate": 3.131242740998839e-05,
"loss": 0.2275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12798643112182617,
"step": 675,
"valid_targets_mean": 1674.4,
"valid_targets_min": 1240
},
{
"epoch": 0.5535205535205535,
"grad_norm": 0.7293467596139723,
"learning_rate": 3.154471544715447e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09391629695892334,
"step": 680,
"valid_targets_mean": 1697.1,
"valid_targets_min": 917
},
{
"epoch": 0.5575905575905576,
"grad_norm": 0.904279770364778,
"learning_rate": 3.177700348432056e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09674836695194244,
"step": 685,
"valid_targets_mean": 1580.9,
"valid_targets_min": 930
},
{
"epoch": 0.5616605616605617,
"grad_norm": 0.914638142832871,
"learning_rate": 3.200929152148664e-05,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12186380475759506,
"step": 690,
"valid_targets_mean": 1655.1,
"valid_targets_min": 1227
},
{
"epoch": 0.5657305657305657,
"grad_norm": 0.980002165464352,
"learning_rate": 3.2241579558652736e-05,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11551667749881744,
"step": 695,
"valid_targets_mean": 1565.8,
"valid_targets_min": 870
},
{
"epoch": 0.5698005698005698,
"grad_norm": 1.0160528027914253,
"learning_rate": 3.2473867595818815e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11251623183488846,
"step": 700,
"valid_targets_mean": 1564.6,
"valid_targets_min": 822
},
{
"epoch": 0.5738705738705738,
"grad_norm": 0.874400875096317,
"learning_rate": 3.270615563298491e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10493709146976471,
"step": 705,
"valid_targets_mean": 1540.5,
"valid_targets_min": 1214
},
{
"epoch": 0.577940577940578,
"grad_norm": 1.0055632341013279,
"learning_rate": 3.293844367015099e-05,
"loss": 0.2264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10630016028881073,
"step": 710,
"valid_targets_mean": 1268.6,
"valid_targets_min": 591
},
{
"epoch": 0.582010582010582,
"grad_norm": 0.9150089746862734,
"learning_rate": 3.3170731707317074e-05,
"loss": 0.2416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08800828456878662,
"step": 715,
"valid_targets_mean": 1232.5,
"valid_targets_min": 646
},
{
"epoch": 0.5860805860805861,
"grad_norm": 1.0300200490056817,
"learning_rate": 3.340301974448316e-05,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12390526384115219,
"step": 720,
"valid_targets_mean": 3032.8,
"valid_targets_min": 2115
},
{
"epoch": 0.5901505901505901,
"grad_norm": 0.7910194368969308,
"learning_rate": 3.3635307781649246e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10102251172065735,
"step": 725,
"valid_targets_mean": 2553.1,
"valid_targets_min": 324
},
{
"epoch": 0.5942205942205943,
"grad_norm": 0.6300733315613507,
"learning_rate": 3.386759581881533e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08729104697704315,
"step": 730,
"valid_targets_mean": 2212.5,
"valid_targets_min": 982
},
{
"epoch": 0.5982905982905983,
"grad_norm": 0.5343519490234325,
"learning_rate": 3.409988385598142e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09156970679759979,
"step": 735,
"valid_targets_mean": 3619.4,
"valid_targets_min": 2479
},
{
"epoch": 0.6023606023606024,
"grad_norm": 0.5149220005414784,
"learning_rate": 3.4332171893147505e-05,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058362703770399094,
"step": 740,
"valid_targets_mean": 3030.5,
"valid_targets_min": 811
},
{
"epoch": 0.6064306064306064,
"grad_norm": 0.548518746299089,
"learning_rate": 3.456445993031359e-05,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08780361711978912,
"step": 745,
"valid_targets_mean": 2922.1,
"valid_targets_min": 1431
},
{
"epoch": 0.6105006105006106,
"grad_norm": 0.9179436846133354,
"learning_rate": 3.479674796747968e-05,
"loss": 0.2208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17820069193840027,
"step": 750,
"valid_targets_mean": 1991.0,
"valid_targets_min": 703
},
{
"epoch": 0.6145706145706146,
"grad_norm": 0.49726406345055274,
"learning_rate": 3.5029036004645764e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0863165408372879,
"step": 755,
"valid_targets_mean": 3251.1,
"valid_targets_min": 621
},
{
"epoch": 0.6186406186406186,
"grad_norm": 0.5932447846887592,
"learning_rate": 3.526132404181185e-05,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08991111069917679,
"step": 760,
"valid_targets_mean": 2681.1,
"valid_targets_min": 846
},
{
"epoch": 0.6227106227106227,
"grad_norm": 0.6378496859580239,
"learning_rate": 3.5493612078977936e-05,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10263900458812714,
"step": 765,
"valid_targets_mean": 3618.6,
"valid_targets_min": 1369
},
{
"epoch": 0.6267806267806267,
"grad_norm": 0.48515918366222455,
"learning_rate": 3.572590011614402e-05,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07100746035575867,
"step": 770,
"valid_targets_mean": 2980.5,
"valid_targets_min": 754
},
{
"epoch": 0.6308506308506309,
"grad_norm": 0.5735235317908716,
"learning_rate": 3.595818815331011e-05,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08798329532146454,
"step": 775,
"valid_targets_mean": 2610.8,
"valid_targets_min": 776
},
{
"epoch": 0.6349206349206349,
"grad_norm": 0.456776675223125,
"learning_rate": 3.6190476190476195e-05,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07948589324951172,
"step": 780,
"valid_targets_mean": 3132.1,
"valid_targets_min": 754
},
{
"epoch": 0.638990638990639,
"grad_norm": 0.9011326371623981,
"learning_rate": 3.642276422764228e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2592279314994812,
"step": 785,
"valid_targets_mean": 2020.8,
"valid_targets_min": 664
},
{
"epoch": 0.643060643060643,
"grad_norm": 0.4732929096663725,
"learning_rate": 3.665505226480837e-05,
"loss": 0.1367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0800432413816452,
"step": 790,
"valid_targets_mean": 3713.8,
"valid_targets_min": 2542
},
{
"epoch": 0.6471306471306472,
"grad_norm": 0.526624007045652,
"learning_rate": 3.688734030197445e-05,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09772545099258423,
"step": 795,
"valid_targets_mean": 3191.9,
"valid_targets_min": 1462
},
{
"epoch": 0.6512006512006512,
"grad_norm": 0.559506972012892,
"learning_rate": 3.711962833914054e-05,
"loss": 0.1341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09087392687797546,
"step": 800,
"valid_targets_mean": 3721.0,
"valid_targets_min": 3281
},
{
"epoch": 0.6552706552706553,
"grad_norm": 0.556479447905555,
"learning_rate": 3.7351916376306626e-05,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07183747738599777,
"step": 805,
"valid_targets_mean": 3360.4,
"valid_targets_min": 2189
},
{
"epoch": 0.6593406593406593,
"grad_norm": 0.47771197862438014,
"learning_rate": 3.758420441347271e-05,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06540735065937042,
"step": 810,
"valid_targets_mean": 3223.9,
"valid_targets_min": 1590
},
{
"epoch": 0.6634106634106635,
"grad_norm": 0.6194871689055971,
"learning_rate": 3.78164924506388e-05,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09501364827156067,
"step": 815,
"valid_targets_mean": 2352.1,
"valid_targets_min": 597
},
{
"epoch": 0.6674806674806675,
"grad_norm": 0.5709548511328791,
"learning_rate": 3.804878048780488e-05,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07070401310920715,
"step": 820,
"valid_targets_mean": 2612.9,
"valid_targets_min": 701
},
{
"epoch": 0.6715506715506715,
"grad_norm": 0.6298911863782369,
"learning_rate": 3.828106852497097e-05,
"loss": 0.1973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13569210469722748,
"step": 825,
"valid_targets_mean": 2791.8,
"valid_targets_min": 1652
},
{
"epoch": 0.6756206756206756,
"grad_norm": 0.41285244882235234,
"learning_rate": 3.851335656213705e-05,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06671032309532166,
"step": 830,
"valid_targets_mean": 3704.5,
"valid_targets_min": 1908
},
{
"epoch": 0.6796906796906796,
"grad_norm": 0.5540522932015873,
"learning_rate": 3.874564459930314e-05,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05759810283780098,
"step": 835,
"valid_targets_mean": 3204.0,
"valid_targets_min": 842
},
{
"epoch": 0.6837606837606838,
"grad_norm": 0.5067086140456947,
"learning_rate": 3.897793263646922e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07755052298307419,
"step": 840,
"valid_targets_mean": 3402.9,
"valid_targets_min": 2552
},
{
"epoch": 0.6878306878306878,
"grad_norm": 0.4997196495634557,
"learning_rate": 3.9210220673635316e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06302007287740707,
"step": 845,
"valid_targets_mean": 2979.9,
"valid_targets_min": 753
},
{
"epoch": 0.6919006919006919,
"grad_norm": 0.6481848237866301,
"learning_rate": 3.9442508710801395e-05,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08520719408988953,
"step": 850,
"valid_targets_mean": 1296.9,
"valid_targets_min": 568
},
{
"epoch": 0.6959706959706959,
"grad_norm": 0.6442175252045691,
"learning_rate": 3.967479674796748e-05,
"loss": 0.3765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15752309560775757,
"step": 855,
"valid_targets_mean": 3126.9,
"valid_targets_min": 1070
},
{
"epoch": 0.7000407000407001,
"grad_norm": 0.6674141205524147,
"learning_rate": 3.990708478513357e-05,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07941246777772903,
"step": 860,
"valid_targets_mean": 2456.6,
"valid_targets_min": 329
},
{
"epoch": 0.7041107041107041,
"grad_norm": 0.9275941441191697,
"learning_rate": 3.999998518042097e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09268821775913239,
"step": 865,
"valid_targets_mean": 1027.8,
"valid_targets_min": 608
},
{
"epoch": 0.7081807081807082,
"grad_norm": 0.5285806533784231,
"learning_rate": 3.99998946164064e-05,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09387123584747314,
"step": 870,
"valid_targets_mean": 4479.8,
"valid_targets_min": 2772
},
{
"epoch": 0.7122507122507122,
"grad_norm": 0.37957034276853,
"learning_rate": 3.99997217218491e-05,
"loss": 0.1232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03582998737692833,
"step": 875,
"valid_targets_mean": 4843.0,
"valid_targets_min": 3778
},
{
"epoch": 0.7163207163207164,
"grad_norm": 0.41394530709191624,
"learning_rate": 3.999946649746077e-05,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07335696369409561,
"step": 880,
"valid_targets_mean": 4306.0,
"valid_targets_min": 2336
},
{
"epoch": 0.7203907203907204,
"grad_norm": 0.4646047347434619,
"learning_rate": 3.999912894429209e-05,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09124352037906647,
"step": 885,
"valid_targets_mean": 3579.5,
"valid_targets_min": 846
},
{
"epoch": 0.7244607244607245,
"grad_norm": 0.44725991333845716,
"learning_rate": 3.999870906373257e-05,
"loss": 0.136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07628832757472992,
"step": 890,
"valid_targets_mean": 2909.1,
"valid_targets_min": 798
},
{
"epoch": 0.7285307285307285,
"grad_norm": 0.5172719098407891,
"learning_rate": 3.999820685751071e-05,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057969748973846436,
"step": 895,
"valid_targets_mean": 2008.5,
"valid_targets_min": 533
},
{
"epoch": 0.7326007326007326,
"grad_norm": 0.5824331819625881,
"learning_rate": 3.9997622327693844e-05,
"loss": 0.1338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06565313041210175,
"step": 900,
"valid_targets_mean": 2598.2,
"valid_targets_min": 833
},
{
"epoch": 0.7366707366707367,
"grad_norm": 0.3535344374037899,
"learning_rate": 3.999695547668823e-05,
"loss": 0.1257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06244448944926262,
"step": 905,
"valid_targets_mean": 4031.8,
"valid_targets_min": 3391
},
{
"epoch": 0.7407407407407407,
"grad_norm": 0.6239344756497878,
"learning_rate": 3.9996206307238974e-05,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15695582330226898,
"step": 910,
"valid_targets_mean": 1909.9,
"valid_targets_min": 732
},
{
"epoch": 0.7448107448107448,
"grad_norm": 0.5990548788322103,
"learning_rate": 3.9995374822430085e-05,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06945429742336273,
"step": 915,
"valid_targets_mean": 1908.9,
"valid_targets_min": 538
},
{
"epoch": 0.7488807488807488,
"grad_norm": 0.7675363094142649,
"learning_rate": 3.999446102568441e-05,
"loss": 0.12,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06405394524335861,
"step": 920,
"valid_targets_mean": 824.9,
"valid_targets_min": 720
},
{
"epoch": 0.752950752950753,
"grad_norm": 0.485700948966615,
"learning_rate": 3.9993464920763625e-05,
"loss": 0.1248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059826068580150604,
"step": 925,
"valid_targets_mean": 3181.1,
"valid_targets_min": 2328
},
{
"epoch": 0.757020757020757,
"grad_norm": 0.5240818086557136,
"learning_rate": 3.9992386511768256e-05,
"loss": 0.1205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0472230464220047,
"step": 930,
"valid_targets_mean": 2581.4,
"valid_targets_min": 684
},
{
"epoch": 0.7610907610907611,
"grad_norm": 0.45360997168418743,
"learning_rate": 3.999122580313763e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06742153316736221,
"step": 935,
"valid_targets_mean": 3461.2,
"valid_targets_min": 2795
},
{
"epoch": 0.7651607651607651,
"grad_norm": 0.44183845519885645,
"learning_rate": 3.998998279964985e-05,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06665977835655212,
"step": 940,
"valid_targets_mean": 3382.6,
"valid_targets_min": 744
},
{
"epoch": 0.7692307692307693,
"grad_norm": 0.3888042558436287,
"learning_rate": 3.99886575064218e-05,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04930161312222481,
"step": 945,
"valid_targets_mean": 3966.6,
"valid_targets_min": 3279
},
{
"epoch": 0.7733007733007733,
"grad_norm": 0.781091504085825,
"learning_rate": 3.9987249928909134e-05,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06562864780426025,
"step": 950,
"valid_targets_mean": 792.1,
"valid_targets_min": 536
},
{
"epoch": 0.7773707773707774,
"grad_norm": 0.5459088120181143,
"learning_rate": 3.998576007290619e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07265473157167435,
"step": 955,
"valid_targets_mean": 2227.4,
"valid_targets_min": 853
},
{
"epoch": 0.7814407814407814,
"grad_norm": 0.5220107941150061,
"learning_rate": 3.998418794454604e-05,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06951494514942169,
"step": 960,
"valid_targets_mean": 3105.6,
"valid_targets_min": 2621
},
{
"epoch": 0.7855107855107855,
"grad_norm": 0.8069948423800993,
"learning_rate": 3.998253355030043e-05,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08019239455461502,
"step": 965,
"valid_targets_mean": 1028.0,
"valid_targets_min": 728
},
{
"epoch": 0.7895807895807896,
"grad_norm": 0.7429706122743682,
"learning_rate": 3.9980796896979754e-05,
"loss": 0.1414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08751674741506577,
"step": 970,
"valid_targets_mean": 1574.2,
"valid_targets_min": 618
},
{
"epoch": 0.7936507936507936,
"grad_norm": 0.39203442846152786,
"learning_rate": 3.997897799173304e-05,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08704735338687897,
"step": 975,
"valid_targets_mean": 4135.0,
"valid_targets_min": 907
},
{
"epoch": 0.7977207977207977,
"grad_norm": 0.5960348844477907,
"learning_rate": 3.9977076842047875e-05,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11054828017950058,
"step": 980,
"valid_targets_mean": 3060.8,
"valid_targets_min": 580
},
{
"epoch": 0.8017908017908018,
"grad_norm": 0.4111968138383219,
"learning_rate": 3.997509345575045e-05,
"loss": 0.1165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05692315846681595,
"step": 985,
"valid_targets_mean": 3413.8,
"valid_targets_min": 726
},
{
"epoch": 0.8058608058608059,
"grad_norm": 0.4256293187737857,
"learning_rate": 3.997302784100548e-05,
"loss": 0.1143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07128673046827316,
"step": 990,
"valid_targets_mean": 4560.9,
"valid_targets_min": 2613
},
{
"epoch": 0.8099308099308099,
"grad_norm": 0.5345662568540609,
"learning_rate": 3.9970880006316154e-05,
"loss": 0.13,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08130151033401489,
"step": 995,
"valid_targets_mean": 2847.2,
"valid_targets_min": 531
},
{
"epoch": 0.814000814000814,
"grad_norm": 0.4593774947539876,
"learning_rate": 3.996864996052416e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06226513907313347,
"step": 1000,
"valid_targets_mean": 2571.5,
"valid_targets_min": 826
},
{
"epoch": 0.818070818070818,
"grad_norm": 0.4128348658429294,
"learning_rate": 3.996633771280956e-05,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05955663323402405,
"step": 1005,
"valid_targets_mean": 3709.6,
"valid_targets_min": 3024
},
{
"epoch": 0.8221408221408222,
"grad_norm": 0.4342247430230778,
"learning_rate": 3.996394327269085e-05,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07043300569057465,
"step": 1010,
"valid_targets_mean": 3559.0,
"valid_targets_min": 2588
},
{
"epoch": 0.8262108262108262,
"grad_norm": 0.6288265395421371,
"learning_rate": 3.996146665002486e-05,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08794619888067245,
"step": 1015,
"valid_targets_mean": 913.9,
"valid_targets_min": 502
},
{
"epoch": 0.8302808302808303,
"grad_norm": 0.42302660971720984,
"learning_rate": 3.995890785500673e-05,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061350464820861816,
"step": 1020,
"valid_targets_mean": 3301.9,
"valid_targets_min": 1158
},
{
"epoch": 0.8343508343508343,
"grad_norm": 0.3202899133836535,
"learning_rate": 3.995626689816986e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05292180925607681,
"step": 1025,
"valid_targets_mean": 3874.9,
"valid_targets_min": 3044
},
{
"epoch": 0.8384208384208384,
"grad_norm": 0.4395087698128267,
"learning_rate": 3.9953543790385885e-05,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06124342978000641,
"step": 1030,
"valid_targets_mean": 2167.8,
"valid_targets_min": 539
},
{
"epoch": 0.8424908424908425,
"grad_norm": 0.45572335142795467,
"learning_rate": 3.99507385428646e-05,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0583365373313427,
"step": 1035,
"valid_targets_mean": 2397.0,
"valid_targets_min": 387
},
{
"epoch": 0.8465608465608465,
"grad_norm": 0.6042755009543974,
"learning_rate": 3.994785116715395e-05,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08790750801563263,
"step": 1040,
"valid_targets_mean": 2340.9,
"valid_targets_min": 872
},
{
"epoch": 0.8506308506308506,
"grad_norm": 0.4360163793065081,
"learning_rate": 3.9944881675139956e-05,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052534107118844986,
"step": 1045,
"valid_targets_mean": 3017.2,
"valid_targets_min": 822
},
{
"epoch": 0.8547008547008547,
"grad_norm": 0.7915374414247746,
"learning_rate": 3.9941830079046686e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10059764981269836,
"step": 1050,
"valid_targets_mean": 1405.9,
"valid_targets_min": 605
},
{
"epoch": 0.8587708587708588,
"grad_norm": 0.5768502808481547,
"learning_rate": 3.9938696391436165e-05,
"loss": 0.1304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08434294909238815,
"step": 1055,
"valid_targets_mean": 2249.2,
"valid_targets_min": 808
},
{
"epoch": 0.8628408628408628,
"grad_norm": 0.44611255063891225,
"learning_rate": 3.993548062520839e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06437411904335022,
"step": 1060,
"valid_targets_mean": 2900.5,
"valid_targets_min": 1010
},
{
"epoch": 0.8669108669108669,
"grad_norm": 0.40352294092211805,
"learning_rate": 3.9932182793601216e-05,
"loss": 0.1292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047206662595272064,
"step": 1065,
"valid_targets_mean": 2432.6,
"valid_targets_min": 524
},
{
"epoch": 0.870980870980871,
"grad_norm": 0.48655652159394597,
"learning_rate": 3.992880291019032e-05,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04721086844801903,
"step": 1070,
"valid_targets_mean": 1303.5,
"valid_targets_min": 516
},
{
"epoch": 0.8750508750508751,
"grad_norm": 0.5368186314445392,
"learning_rate": 3.992534098888916e-05,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06309214979410172,
"step": 1075,
"valid_targets_mean": 1762.1,
"valid_targets_min": 342
},
{
"epoch": 0.8791208791208791,
"grad_norm": 0.3615301144651535,
"learning_rate": 3.992179704394891e-05,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061992619186639786,
"step": 1080,
"valid_targets_mean": 3301.8,
"valid_targets_min": 1440
},
{
"epoch": 0.8831908831908832,
"grad_norm": 0.47684964360761173,
"learning_rate": 3.991817108995838e-05,
"loss": 0.1145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053332049399614334,
"step": 1085,
"valid_targets_mean": 2274.2,
"valid_targets_min": 708
},
{
"epoch": 0.8872608872608873,
"grad_norm": 0.3277156842140217,
"learning_rate": 3.9914463141844e-05,
"loss": 0.1241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058171793818473816,
"step": 1090,
"valid_targets_mean": 5103.1,
"valid_targets_min": 3653
},
{
"epoch": 0.8913308913308914,
"grad_norm": 0.37913532995319227,
"learning_rate": 3.991067321486971e-05,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04157901927828789,
"step": 1095,
"valid_targets_mean": 2366.5,
"valid_targets_min": 684
},
{
"epoch": 0.8954008954008954,
"grad_norm": 0.44728273843652605,
"learning_rate": 3.990680132463694e-05,
"loss": 0.1065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06624357402324677,
"step": 1100,
"valid_targets_mean": 3352.1,
"valid_targets_min": 726
},
{
"epoch": 0.8994708994708994,
"grad_norm": 0.3699276991369879,
"learning_rate": 3.99028474870845e-05,
"loss": 0.1372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06432875990867615,
"step": 1105,
"valid_targets_mean": 4009.6,
"valid_targets_min": 3076
},
{
"epoch": 0.9035409035409036,
"grad_norm": 0.559438917402308,
"learning_rate": 3.989881171848857e-05,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19042916595935822,
"step": 1110,
"valid_targets_mean": 2811.9,
"valid_targets_min": 1536
},
{
"epoch": 0.9076109076109076,
"grad_norm": 0.4455049575824879,
"learning_rate": 3.989469403546258e-05,
"loss": 0.1275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07045942544937134,
"step": 1115,
"valid_targets_mean": 2669.4,
"valid_targets_min": 582
},
{
"epoch": 0.9116809116809117,
"grad_norm": 0.35606075856961944,
"learning_rate": 3.989049445495718e-05,
"loss": 0.1334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05114404112100601,
"step": 1120,
"valid_targets_mean": 3261.9,
"valid_targets_min": 633
},
{
"epoch": 0.9157509157509157,
"grad_norm": 0.37757857329286704,
"learning_rate": 3.9886212994260146e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04709208756685257,
"step": 1125,
"valid_targets_mean": 3287.2,
"valid_targets_min": 1130
},
{
"epoch": 0.9198209198209198,
"grad_norm": 0.40732084354821907,
"learning_rate": 3.98818496709963e-05,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06523814797401428,
"step": 1130,
"valid_targets_mean": 2858.9,
"valid_targets_min": 492
},
{
"epoch": 0.9238909238909239,
"grad_norm": 0.7103621320340062,
"learning_rate": 3.987740450312751e-05,
"loss": 0.1378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08393198251724243,
"step": 1135,
"valid_targets_mean": 2531.5,
"valid_targets_min": 1045
},
{
"epoch": 0.927960927960928,
"grad_norm": 0.38515151498760647,
"learning_rate": 3.9872877508952506e-05,
"loss": 0.1224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04183115065097809,
"step": 1140,
"valid_targets_mean": 2692.0,
"valid_targets_min": 647
},
{
"epoch": 0.932030932030932,
"grad_norm": 0.6540079458171796,
"learning_rate": 3.9868268707106884e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13763931393623352,
"step": 1145,
"valid_targets_mean": 1831.5,
"valid_targets_min": 806
},
{
"epoch": 0.9361009361009361,
"grad_norm": 0.6012472482945602,
"learning_rate": 3.9863578116563e-05,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06246567517518997,
"step": 1150,
"valid_targets_mean": 1300.1,
"valid_targets_min": 575
},
{
"epoch": 0.9401709401709402,
"grad_norm": 0.44241303636120555,
"learning_rate": 3.9858805756629906e-05,
"loss": 0.1246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057974182069301605,
"step": 1155,
"valid_targets_mean": 3615.9,
"valid_targets_min": 3193
},
{
"epoch": 0.9442409442409443,
"grad_norm": 0.3903708665427787,
"learning_rate": 3.985395164695324e-05,
"loss": 0.1287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05488427355885506,
"step": 1160,
"valid_targets_mean": 3944.1,
"valid_targets_min": 3433
},
{
"epoch": 0.9483109483109483,
"grad_norm": 0.39685042835856477,
"learning_rate": 3.98490158075152e-05,
"loss": 0.1271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05394378677010536,
"step": 1165,
"valid_targets_mean": 2874.5,
"valid_targets_min": 767
},
{
"epoch": 0.9523809523809523,
"grad_norm": 0.4929139704427634,
"learning_rate": 3.9843998258634397e-05,
"loss": 0.119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0530795156955719,
"step": 1170,
"valid_targets_mean": 2262.1,
"valid_targets_min": 785
},
{
"epoch": 0.9564509564509565,
"grad_norm": 0.7315882847416906,
"learning_rate": 3.983889902096582e-05,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08292382210493088,
"step": 1175,
"valid_targets_mean": 1222.8,
"valid_targets_min": 758
},
{
"epoch": 0.9605209605209605,
"grad_norm": 0.4497078672225934,
"learning_rate": 3.9833718115500735e-05,
"loss": 0.1105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057786524295806885,
"step": 1180,
"valid_targets_mean": 2184.0,
"valid_targets_min": 797
},
{
"epoch": 0.9645909645909646,
"grad_norm": 0.37472458302150724,
"learning_rate": 3.9828455563566585e-05,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058492764830589294,
"step": 1185,
"valid_targets_mean": 3445.0,
"valid_targets_min": 1606
},
{
"epoch": 0.9686609686609686,
"grad_norm": 0.49178605406882114,
"learning_rate": 3.982311138682693e-05,
"loss": 0.1299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07257603108882904,
"step": 1190,
"valid_targets_mean": 2760.0,
"valid_targets_min": 678
},
{
"epoch": 0.9727309727309728,
"grad_norm": 0.30926831647178493,
"learning_rate": 3.981768560728132e-05,
"loss": 0.1272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06540581583976746,
"step": 1195,
"valid_targets_mean": 5550.0,
"valid_targets_min": 3997
},
{
"epoch": 0.9768009768009768,
"grad_norm": 0.3480919181704012,
"learning_rate": 3.981217824726525e-05,
"loss": 0.113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035894401371479034,
"step": 1200,
"valid_targets_mean": 2142.1,
"valid_targets_min": 706
},
{
"epoch": 0.9808709808709809,
"grad_norm": 0.6953856332846773,
"learning_rate": 3.9806589329450045e-05,
"loss": 0.1299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09473567456007004,
"step": 1205,
"valid_targets_mean": 1705.0,
"valid_targets_min": 580
},
{
"epoch": 0.9849409849409849,
"grad_norm": 0.6447718942126139,
"learning_rate": 3.980091887684274e-05,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11416690051555634,
"step": 1210,
"valid_targets_mean": 2792.0,
"valid_targets_min": 2379
},
{
"epoch": 0.989010989010989,
"grad_norm": 0.44493565718387146,
"learning_rate": 3.979516691278605e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05794357508420944,
"step": 1215,
"valid_targets_mean": 3489.0,
"valid_targets_min": 2861
},
{
"epoch": 0.9930809930809931,
"grad_norm": 0.3554690075057992,
"learning_rate": 3.9789333460958195e-05,
"loss": 0.1248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06033288687467575,
"step": 1220,
"valid_targets_mean": 3850.4,
"valid_targets_min": 2453
},
{
"epoch": 0.9971509971509972,
"grad_norm": 0.39798751935774657,
"learning_rate": 3.978341854537288e-05,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06392422318458557,
"step": 1225,
"valid_targets_mean": 3932.9,
"valid_targets_min": 3389
},
{
"epoch": 1.0008140008140007,
"grad_norm": 0.5953058538336475,
"learning_rate": 3.977742219037914e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14234861731529236,
"step": 1230,
"valid_targets_mean": 8215.2,
"valid_targets_min": 6163
},
{
"epoch": 1.0048840048840049,
"grad_norm": 0.4684299696968115,
"learning_rate": 3.9771344420661265e-05,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.144585520029068,
"step": 1235,
"valid_targets_mean": 8594.4,
"valid_targets_min": 6006
},
{
"epoch": 1.008954008954009,
"grad_norm": 0.6867925767436964,
"learning_rate": 3.9765185261238685e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1256946623325348,
"step": 1240,
"valid_targets_mean": 3578.4,
"valid_targets_min": 289
},
{
"epoch": 1.0130240130240131,
"grad_norm": 0.42999406091039816,
"learning_rate": 3.9758944737465885e-05,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13307125866413116,
"step": 1245,
"valid_targets_mean": 7019.9,
"valid_targets_min": 4985
},
{
"epoch": 1.017094017094017,
"grad_norm": 0.43330214352879454,
"learning_rate": 3.9752622875032275e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12875577807426453,
"step": 1250,
"valid_targets_mean": 6956.6,
"valid_targets_min": 1457
},
{
"epoch": 1.0211640211640212,
"grad_norm": 0.4137992292045322,
"learning_rate": 3.974621969996213e-05,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12030914425849915,
"step": 1255,
"valid_targets_mean": 7361.6,
"valid_targets_min": 4961
},
{
"epoch": 1.0252340252340253,
"grad_norm": 0.5022158686145597,
"learning_rate": 3.973973523861442e-05,
"loss": 0.269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15889611840248108,
"step": 1260,
"valid_targets_mean": 7058.5,
"valid_targets_min": 5985
},
{
"epoch": 1.0293040293040292,
"grad_norm": 0.39049657893691275,
"learning_rate": 3.973316951768275e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14278875291347504,
"step": 1265,
"valid_targets_mean": 7664.2,
"valid_targets_min": 5169
},
{
"epoch": 1.0333740333740333,
"grad_norm": 0.42504045855242684,
"learning_rate": 3.972652256419522e-05,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12719795107841492,
"step": 1270,
"valid_targets_mean": 7111.8,
"valid_targets_min": 5348
},
{
"epoch": 1.0374440374440375,
"grad_norm": 0.4952882040537086,
"learning_rate": 3.971979440551436e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11728663742542267,
"step": 1275,
"valid_targets_mean": 4238.9,
"valid_targets_min": 152
},
{
"epoch": 1.0415140415140416,
"grad_norm": 0.4181601879292703,
"learning_rate": 3.9712985069336955e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12817908823490143,
"step": 1280,
"valid_targets_mean": 7199.4,
"valid_targets_min": 4258
},
{
"epoch": 1.0455840455840455,
"grad_norm": 0.48722985192181184,
"learning_rate": 3.9706094583693954e-05,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1204463317990303,
"step": 1285,
"valid_targets_mean": 7243.4,
"valid_targets_min": 5831
},
{
"epoch": 1.0496540496540496,
"grad_norm": 0.4108207703430436,
"learning_rate": 3.96991229769504e-05,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1202164739370346,
"step": 1290,
"valid_targets_mean": 6950.6,
"valid_targets_min": 3862
},
{
"epoch": 1.0537240537240538,
"grad_norm": 0.40991192760617895,
"learning_rate": 3.969207027780524e-05,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1293250173330307,
"step": 1295,
"valid_targets_mean": 6991.9,
"valid_targets_min": 5696
},
{
"epoch": 1.0577940577940579,
"grad_norm": 0.42826333297089153,
"learning_rate": 3.968493651529126e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1293313354253769,
"step": 1300,
"valid_targets_mean": 6963.5,
"valid_targets_min": 4947
},
{
"epoch": 1.0618640618640618,
"grad_norm": 0.39443414280580313,
"learning_rate": 3.967772171877494e-05,
"loss": 0.2361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11275345087051392,
"step": 1305,
"valid_targets_mean": 6436.9,
"valid_targets_min": 4988
},
{
"epoch": 1.065934065934066,
"grad_norm": 0.4373139454687315,
"learning_rate": 3.967042591795634e-05,
"loss": 0.2394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11951905488967896,
"step": 1310,
"valid_targets_mean": 7518.0,
"valid_targets_min": 5476
},
{
"epoch": 1.07000407000407,
"grad_norm": 0.38657017917234543,
"learning_rate": 3.966304914286898e-05,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10981670022010803,
"step": 1315,
"valid_targets_mean": 7422.6,
"valid_targets_min": 5226
},
{
"epoch": 1.074074074074074,
"grad_norm": 0.46603622908971615,
"learning_rate": 3.965559142387972e-05,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15436352789402008,
"step": 1320,
"valid_targets_mean": 7080.0,
"valid_targets_min": 3753
},
{
"epoch": 1.078144078144078,
"grad_norm": 0.5089544183960755,
"learning_rate": 3.964805279168862e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13544388115406036,
"step": 1325,
"valid_targets_mean": 6064.6,
"valid_targets_min": 5161
},
{
"epoch": 1.0822140822140822,
"grad_norm": 0.4213050484999416,
"learning_rate": 3.9640433277328824e-05,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11462973058223724,
"step": 1330,
"valid_targets_mean": 7388.1,
"valid_targets_min": 5795
},
{
"epoch": 1.0862840862840863,
"grad_norm": 0.3819112265649167,
"learning_rate": 3.963273291216645e-05,
"loss": 0.2253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10795051604509354,
"step": 1335,
"valid_targets_mean": 7696.0,
"valid_targets_min": 4658
},
{
"epoch": 1.0903540903540903,
"grad_norm": 0.4114432948340316,
"learning_rate": 3.9624951727900406e-05,
"loss": 0.2316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12693330645561218,
"step": 1340,
"valid_targets_mean": 7799.1,
"valid_targets_min": 5508
},
{
"epoch": 1.0944240944240944,
"grad_norm": 0.4056233219924477,
"learning_rate": 3.9617089756562334e-05,
"loss": 0.2435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11809612810611725,
"step": 1345,
"valid_targets_mean": 7341.6,
"valid_targets_min": 6454
},
{
"epoch": 1.0984940984940985,
"grad_norm": 0.4188231753878829,
"learning_rate": 3.960914703051642e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10444575548171997,
"step": 1350,
"valid_targets_mean": 6818.0,
"valid_targets_min": 4392
},
{
"epoch": 1.1025641025641026,
"grad_norm": 0.3886197018701831,
"learning_rate": 3.960112358245927e-05,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10350356996059418,
"step": 1355,
"valid_targets_mean": 7857.6,
"valid_targets_min": 5394
},
{
"epoch": 1.1066341066341066,
"grad_norm": 0.35882023777430566,
"learning_rate": 3.9593019445419814e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09432516247034073,
"step": 1360,
"valid_targets_mean": 8314.1,
"valid_targets_min": 4837
},
{
"epoch": 1.1107041107041107,
"grad_norm": 0.3392184288683715,
"learning_rate": 3.9584834652759124e-05,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08807634562253952,
"step": 1365,
"valid_targets_mean": 7368.2,
"valid_targets_min": 6027
},
{
"epoch": 1.1147741147741148,
"grad_norm": 0.4323967342653223,
"learning_rate": 3.95765692381703e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11778441816568375,
"step": 1370,
"valid_targets_mean": 6435.0,
"valid_targets_min": 4238
},
{
"epoch": 1.118844118844119,
"grad_norm": 1.7395054695099226,
"learning_rate": 3.956822323567832e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10033954679965973,
"step": 1375,
"valid_targets_mean": 247.8,
"valid_targets_min": 137
},
{
"epoch": 1.1229141229141228,
"grad_norm": 0.42995283027411474,
"learning_rate": 3.9559796679639914e-05,
"loss": 0.2437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11196690052747726,
"step": 1380,
"valid_targets_mean": 6807.0,
"valid_targets_min": 5165
},
{
"epoch": 1.126984126984127,
"grad_norm": 0.4579494248210466,
"learning_rate": 3.955128960474341e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1293865293264389,
"step": 1385,
"valid_targets_mean": 6989.9,
"valid_targets_min": 5104
},
{
"epoch": 1.131054131054131,
"grad_norm": 0.41699725958422584,
"learning_rate": 3.95427020460086e-05,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13233298063278198,
"step": 1390,
"valid_targets_mean": 6692.2,
"valid_targets_min": 5068
},
{
"epoch": 1.1351241351241352,
"grad_norm": 0.4309390492887969,
"learning_rate": 3.953403403878659e-05,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1428421139717102,
"step": 1395,
"valid_targets_mean": 7419.6,
"valid_targets_min": 5578
},
{
"epoch": 1.1391941391941391,
"grad_norm": 0.3957195172464458,
"learning_rate": 3.952528561875966e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11624685674905777,
"step": 1400,
"valid_targets_mean": 7536.5,
"valid_targets_min": 5075
},
{
"epoch": 1.1432641432641433,
"grad_norm": 0.4039821590351794,
"learning_rate": 3.951645682194109e-05,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1071617528796196,
"step": 1405,
"valid_targets_mean": 7221.5,
"valid_targets_min": 5841
},
{
"epoch": 1.1473341473341474,
"grad_norm": 0.41845015880407643,
"learning_rate": 3.950754768467506e-05,
"loss": 0.23,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11402362585067749,
"step": 1410,
"valid_targets_mean": 7287.5,
"valid_targets_min": 5151
},
{
"epoch": 1.1514041514041513,
"grad_norm": 0.40797870681631443,
"learning_rate": 3.949855824363647e-05,
"loss": 0.2405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11144113540649414,
"step": 1415,
"valid_targets_mean": 6738.4,
"valid_targets_min": 4042
},
{
"epoch": 1.1554741554741554,
"grad_norm": 0.43409193061927426,
"learning_rate": 3.948948853583081e-05,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12913505733013153,
"step": 1420,
"valid_targets_mean": 6331.0,
"valid_targets_min": 5496
},
{
"epoch": 1.1595441595441596,
"grad_norm": 0.43403376610064975,
"learning_rate": 3.9480338598593955e-05,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11496134102344513,
"step": 1425,
"valid_targets_mean": 6271.1,
"valid_targets_min": 4695
},
{
"epoch": 1.1636141636141637,
"grad_norm": 0.45486378077738254,
"learning_rate": 3.947110846959207e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12110753357410431,
"step": 1430,
"valid_targets_mean": 5790.8,
"valid_targets_min": 5021
},
{
"epoch": 1.1676841676841676,
"grad_norm": 0.4865911390888994,
"learning_rate": 3.9461798186821434e-05,
"loss": 0.2264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09251779317855835,
"step": 1435,
"valid_targets_mean": 3386.8,
"valid_targets_min": 2279
},
{
"epoch": 1.1717541717541717,
"grad_norm": 0.45904203833658064,
"learning_rate": 3.9452407788608275e-05,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11358363926410675,
"step": 1440,
"valid_targets_mean": 6240.5,
"valid_targets_min": 5093
},
{
"epoch": 1.1758241758241759,
"grad_norm": 0.46020651070927404,
"learning_rate": 3.9442937313608646e-05,
"loss": 0.2275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11856567859649658,
"step": 1445,
"valid_targets_mean": 6329.5,
"valid_targets_min": 4589
},
{
"epoch": 1.17989417989418,
"grad_norm": 0.3983320494029986,
"learning_rate": 3.94333868008082e-05,
"loss": 0.2265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12220582365989685,
"step": 1450,
"valid_targets_mean": 7589.2,
"valid_targets_min": 4963
},
{
"epoch": 1.183964183964184,
"grad_norm": 0.4581307530062702,
"learning_rate": 3.94237562895221e-05,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09797120094299316,
"step": 1455,
"valid_targets_mean": 5577.9,
"valid_targets_min": 4458
},
{
"epoch": 1.188034188034188,
"grad_norm": 0.5075652321634042,
"learning_rate": 3.941404581939481e-05,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10852977633476257,
"step": 1460,
"valid_targets_mean": 5432.5,
"valid_targets_min": 4433
},
{
"epoch": 1.1921041921041922,
"grad_norm": 0.6232838095901682,
"learning_rate": 3.940425543039996e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11723101139068604,
"step": 1465,
"valid_targets_mean": 6361.8,
"valid_targets_min": 5201
},
{
"epoch": 1.196174196174196,
"grad_norm": 0.42438428970084924,
"learning_rate": 3.939438516284015e-05,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10583050549030304,
"step": 1470,
"valid_targets_mean": 5824.4,
"valid_targets_min": 5129
},
{
"epoch": 1.2002442002442002,
"grad_norm": 0.8552840375409755,
"learning_rate": 3.938443505734684e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1607503890991211,
"step": 1475,
"valid_targets_mean": 1637.6,
"valid_targets_min": 137
},
{
"epoch": 1.2043142043142043,
"grad_norm": 0.4282729691315241,
"learning_rate": 3.9374405154880104e-05,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11325763911008835,
"step": 1480,
"valid_targets_mean": 6474.6,
"valid_targets_min": 4751
},
{
"epoch": 1.2083842083842085,
"grad_norm": 0.45919849824696074,
"learning_rate": 3.9364295496728545e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1222546175122261,
"step": 1485,
"valid_targets_mean": 7186.2,
"valid_targets_min": 5358
},
{
"epoch": 1.2124542124542124,
"grad_norm": 0.41905751280920195,
"learning_rate": 3.9354106124509045e-05,
"loss": 0.2288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11492247879505157,
"step": 1490,
"valid_targets_mean": 7126.8,
"valid_targets_min": 4078
},
{
"epoch": 1.2165242165242165,
"grad_norm": 0.4228687168767464,
"learning_rate": 3.934383708016667e-05,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11097435653209686,
"step": 1495,
"valid_targets_mean": 7022.1,
"valid_targets_min": 4940
},
{
"epoch": 1.2205942205942206,
"grad_norm": 0.42085225391276915,
"learning_rate": 3.9333488405974434e-05,
"loss": 0.2153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11520600318908691,
"step": 1500,
"valid_targets_mean": 5900.6,
"valid_targets_min": 4779
},
{
"epoch": 1.2246642246642248,
"grad_norm": 0.4633839046298897,
"learning_rate": 3.932306014453315e-05,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11590239405632019,
"step": 1505,
"valid_targets_mean": 6290.1,
"valid_targets_min": 4620
},
{
"epoch": 1.2287342287342287,
"grad_norm": 0.9660012618752344,
"learning_rate": 3.9312552338771284e-05,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10209794342517853,
"step": 1510,
"valid_targets_mean": 1162.2,
"valid_targets_min": 788
},
{
"epoch": 1.2328042328042328,
"grad_norm": 0.8959866942571094,
"learning_rate": 3.9301965031944724e-05,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11823749542236328,
"step": 1515,
"valid_targets_mean": 1500.6,
"valid_targets_min": 957
},
{
"epoch": 1.236874236874237,
"grad_norm": 0.92051115161302,
"learning_rate": 3.929129826763663e-05,
"loss": 0.2339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11000481992959976,
"step": 1520,
"valid_targets_mean": 1371.2,
"valid_targets_min": 796
},
{
"epoch": 1.2409442409442408,
"grad_norm": 0.8905552213698138,
"learning_rate": 3.928055208975726e-05,
"loss": 0.2341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13280996680259705,
"step": 1525,
"valid_targets_mean": 1433.6,
"valid_targets_min": 697
},
{
"epoch": 1.245014245014245,
"grad_norm": 0.7573822137035331,
"learning_rate": 3.926972654254379e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10896831750869751,
"step": 1530,
"valid_targets_mean": 1578.9,
"valid_targets_min": 638
},
{
"epoch": 1.249084249084249,
"grad_norm": 0.7786863011930503,
"learning_rate": 3.92588216705601e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11522305011749268,
"step": 1535,
"valid_targets_mean": 1746.4,
"valid_targets_min": 727
},
{
"epoch": 1.2531542531542532,
"grad_norm": 0.7938573989349429,
"learning_rate": 3.924783751869663e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09873868525028229,
"step": 1540,
"valid_targets_mean": 1309.9,
"valid_targets_min": 761
},
{
"epoch": 1.2572242572242573,
"grad_norm": 0.9426871570045071,
"learning_rate": 3.923677413217019e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13097123801708221,
"step": 1545,
"valid_targets_mean": 1368.6,
"valid_targets_min": 714
},
{
"epoch": 1.2612942612942613,
"grad_norm": 0.8036694210964767,
"learning_rate": 3.9225631556523744e-05,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11239443719387054,
"step": 1550,
"valid_targets_mean": 1491.8,
"valid_targets_min": 867
},
{
"epoch": 1.2653642653642654,
"grad_norm": 0.8084037583756437,
"learning_rate": 3.921440983762624e-05,
"loss": 0.2265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12547224760055542,
"step": 1555,
"valid_targets_mean": 1994.0,
"valid_targets_min": 790
},
{
"epoch": 1.2694342694342695,
"grad_norm": 0.7784763220071113,
"learning_rate": 3.920310902167245e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11351943016052246,
"step": 1560,
"valid_targets_mean": 1523.4,
"valid_targets_min": 896
},
{
"epoch": 1.2735042735042734,
"grad_norm": 0.7880339591266707,
"learning_rate": 3.919172915518271e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11668528616428375,
"step": 1565,
"valid_targets_mean": 1790.1,
"valid_targets_min": 1009
},
{
"epoch": 1.2775742775742776,
"grad_norm": 0.7920585958427674,
"learning_rate": 3.918027028500282e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0921139121055603,
"step": 1570,
"valid_targets_mean": 1394.0,
"valid_targets_min": 717
},
{
"epoch": 1.2816442816442817,
"grad_norm": 0.925447932695446,
"learning_rate": 3.916873245830376e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08572347462177277,
"step": 1575,
"valid_targets_mean": 1129.0,
"valid_targets_min": 659
},
{
"epoch": 1.2857142857142856,
"grad_norm": 0.9814126638216883,
"learning_rate": 3.915711572258157e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10210913419723511,
"step": 1580,
"valid_targets_mean": 1466.9,
"valid_targets_min": 642
},
{
"epoch": 1.2897842897842897,
"grad_norm": 0.7835577295777144,
"learning_rate": 3.914542012565711e-05,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07693362236022949,
"step": 1585,
"valid_targets_mean": 1129.4,
"valid_targets_min": 765
},
{
"epoch": 1.2938542938542938,
"grad_norm": 0.9086732320776554,
"learning_rate": 3.913364571567586e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10597139596939087,
"step": 1590,
"valid_targets_mean": 1322.8,
"valid_targets_min": 631
},
{
"epoch": 1.297924297924298,
"grad_norm": 0.9559891752335423,
"learning_rate": 3.912179254110777e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1286805272102356,
"step": 1595,
"valid_targets_mean": 1612.0,
"valid_targets_min": 623
},
{
"epoch": 1.301994301994302,
"grad_norm": 0.7298047621289229,
"learning_rate": 3.9109860650747e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08292436599731445,
"step": 1600,
"valid_targets_mean": 1402.1,
"valid_targets_min": 940
},
{
"epoch": 1.306064306064306,
"grad_norm": 0.712092191185825,
"learning_rate": 3.9097850093711775e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09930809587240219,
"step": 1605,
"valid_targets_mean": 1337.8,
"valid_targets_min": 776
},
{
"epoch": 1.3101343101343101,
"grad_norm": 0.8337686772674006,
"learning_rate": 3.908576091944412e-05,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12775862216949463,
"step": 1610,
"valid_targets_mean": 1525.5,
"valid_targets_min": 623
},
{
"epoch": 1.3142043142043143,
"grad_norm": 0.8033816144064492,
"learning_rate": 3.907359317770973e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12140291929244995,
"step": 1615,
"valid_targets_mean": 1441.0,
"valid_targets_min": 693
},
{
"epoch": 1.3182743182743182,
"grad_norm": 0.8666725972794019,
"learning_rate": 3.90613469185977e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06115573272109032,
"step": 1620,
"valid_targets_mean": 847.9,
"valid_targets_min": 611
},
{
"epoch": 1.3223443223443223,
"grad_norm": 0.831110404158148,
"learning_rate": 3.904902219252035e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11510695517063141,
"step": 1625,
"valid_targets_mean": 1524.9,
"valid_targets_min": 793
},
{
"epoch": 1.3264143264143264,
"grad_norm": 0.747854141552853,
"learning_rate": 3.903661905021302e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11657039076089859,
"step": 1630,
"valid_targets_mean": 1779.4,
"valid_targets_min": 563
},
{
"epoch": 1.3304843304843303,
"grad_norm": 0.7620995195915982,
"learning_rate": 3.9024137542733846e-05,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12204901874065399,
"step": 1635,
"valid_targets_mean": 1741.2,
"valid_targets_min": 1341
},
{
"epoch": 1.3345543345543345,
"grad_norm": 0.8238415295946188,
"learning_rate": 3.9011577721463574e-05,
"loss": 0.2143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12938036024570465,
"step": 1640,
"valid_targets_mean": 1875.6,
"valid_targets_min": 1107
},
{
"epoch": 1.3386243386243386,
"grad_norm": 0.799416998929109,
"learning_rate": 3.899893963810531e-05,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1031196340918541,
"step": 1645,
"valid_targets_mean": 1419.5,
"valid_targets_min": 680
},
{
"epoch": 1.3426943426943427,
"grad_norm": 0.7699078977660259,
"learning_rate": 3.898622334468435e-05,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14640526473522186,
"step": 1650,
"valid_targets_mean": 1968.2,
"valid_targets_min": 981
},
{
"epoch": 1.3467643467643469,
"grad_norm": 0.7511380642686718,
"learning_rate": 3.897342889354793e-05,
"loss": 0.2129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10663345456123352,
"step": 1655,
"valid_targets_mean": 1568.9,
"valid_targets_min": 937
},
{
"epoch": 1.3508343508343508,
"grad_norm": 0.8037134681077442,
"learning_rate": 3.896055633736504e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11559002846479416,
"step": 1660,
"valid_targets_mean": 1645.2,
"valid_targets_min": 804
},
{
"epoch": 1.354904354904355,
"grad_norm": 0.7949561381518031,
"learning_rate": 3.894760572912618e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1040218248963356,
"step": 1665,
"valid_targets_mean": 1574.9,
"valid_targets_min": 1019
},
{
"epoch": 1.358974358974359,
"grad_norm": 0.7793788473775995,
"learning_rate": 3.8934577122143156e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09460228681564331,
"step": 1670,
"valid_targets_mean": 1121.6,
"valid_targets_min": 882
},
{
"epoch": 1.363044363044363,
"grad_norm": 0.7618292018526198,
"learning_rate": 3.892147057004888e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11588133871555328,
"step": 1675,
"valid_targets_mean": 1818.1,
"valid_targets_min": 1168
},
{
"epoch": 1.367114367114367,
"grad_norm": 0.9942145132530782,
"learning_rate": 3.89082861267971e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09862836450338364,
"step": 1680,
"valid_targets_mean": 1417.8,
"valid_targets_min": 678
},
{
"epoch": 1.3711843711843712,
"grad_norm": 0.8502030826682979,
"learning_rate": 3.889502384666223e-05,
"loss": 0.2146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08241011202335358,
"step": 1685,
"valid_targets_mean": 1051.0,
"valid_targets_min": 676
},
{
"epoch": 1.3752543752543753,
"grad_norm": 0.696356628682868,
"learning_rate": 3.8881683784239086e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09263870120048523,
"step": 1690,
"valid_targets_mean": 1431.1,
"valid_targets_min": 794
},
{
"epoch": 1.3793243793243795,
"grad_norm": 0.7609564628672522,
"learning_rate": 3.8868265994442694e-05,
"loss": 0.2116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11136119812726974,
"step": 1695,
"valid_targets_mean": 1486.9,
"valid_targets_min": 742
},
{
"epoch": 1.3833943833943834,
"grad_norm": 0.779149722488893,
"learning_rate": 3.8854770532508036e-05,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12626802921295166,
"step": 1700,
"valid_targets_mean": 1734.5,
"valid_targets_min": 741
},
{
"epoch": 1.3874643874643875,
"grad_norm": 0.8189444335835692,
"learning_rate": 3.884119745398984e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12554654479026794,
"step": 1705,
"valid_targets_mean": 1712.5,
"valid_targets_min": 1157
},
{
"epoch": 1.3915343915343916,
"grad_norm": 0.7562880779738609,
"learning_rate": 3.882754681476235e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14017203450202942,
"step": 1710,
"valid_targets_mean": 1723.8,
"valid_targets_min": 862
},
{
"epoch": 1.3956043956043955,
"grad_norm": 0.789327271767066,
"learning_rate": 3.881381867101908e-05,
"loss": 0.2231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1333657205104828,
"step": 1715,
"valid_targets_mean": 1633.1,
"valid_targets_min": 1019
},
{
"epoch": 1.3996743996743997,
"grad_norm": 0.6904489176477637,
"learning_rate": 3.880001307927262e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1002424880862236,
"step": 1720,
"valid_targets_mean": 1376.1,
"valid_targets_min": 1058
},
{
"epoch": 1.4037444037444038,
"grad_norm": 0.7331099974034027,
"learning_rate": 3.878613009635434e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11483565717935562,
"step": 1725,
"valid_targets_mean": 1576.5,
"valid_targets_min": 618
},
{
"epoch": 1.4078144078144077,
"grad_norm": 0.7374050495229207,
"learning_rate": 3.877216977941424e-05,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12511426210403442,
"step": 1730,
"valid_targets_mean": 1615.8,
"valid_targets_min": 629
},
{
"epoch": 1.4118844118844118,
"grad_norm": 0.7263856360035532,
"learning_rate": 3.875813218592063e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11008419096469879,
"step": 1735,
"valid_targets_mean": 1881.2,
"valid_targets_min": 1167
},
{
"epoch": 1.415954415954416,
"grad_norm": 0.7714742596712739,
"learning_rate": 3.874401737365996e-05,
"loss": 0.2132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11159549653530121,
"step": 1740,
"valid_targets_mean": 1367.2,
"valid_targets_min": 699
},
{
"epoch": 1.42002442002442,
"grad_norm": 0.768333986171705,
"learning_rate": 3.872982540073654e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08359374105930328,
"step": 1745,
"valid_targets_mean": 1174.9,
"valid_targets_min": 679
},
{
"epoch": 1.4240944240944242,
"grad_norm": 0.730500600250479,
"learning_rate": 3.871555632557232e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09920322895050049,
"step": 1750,
"valid_targets_mean": 1556.2,
"valid_targets_min": 504
},
{
"epoch": 1.4281644281644281,
"grad_norm": 0.8117781426270219,
"learning_rate": 3.870121020690663e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11729609966278076,
"step": 1755,
"valid_targets_mean": 1885.0,
"valid_targets_min": 1331
},
{
"epoch": 1.4322344322344323,
"grad_norm": 0.7215350454916396,
"learning_rate": 3.868678710379599e-05,
"loss": 0.2111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07775722444057465,
"step": 1760,
"valid_targets_mean": 1306.1,
"valid_targets_min": 661
},
{
"epoch": 1.4363044363044364,
"grad_norm": 0.837829363749683,
"learning_rate": 3.86722870756138e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08048004657030106,
"step": 1765,
"valid_targets_mean": 1330.1,
"valid_targets_min": 958
},
{
"epoch": 1.4403744403744403,
"grad_norm": 0.6691854525025749,
"learning_rate": 3.865771018205014e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08131928741931915,
"step": 1770,
"valid_targets_mean": 1465.0,
"valid_targets_min": 963
},
{
"epoch": 1.4444444444444444,
"grad_norm": 0.8158369333281974,
"learning_rate": 3.864305648311149e-05,
"loss": 0.2094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10300800949335098,
"step": 1775,
"valid_targets_mean": 1428.0,
"valid_targets_min": 793
},
{
"epoch": 1.4485144485144485,
"grad_norm": 0.948520302318546,
"learning_rate": 3.8628326039120524e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13352897763252258,
"step": 1780,
"valid_targets_mean": 1633.1,
"valid_targets_min": 917
},
{
"epoch": 1.4525844525844525,
"grad_norm": 0.7365952174032329,
"learning_rate": 3.861351891071583e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08271881937980652,
"step": 1785,
"valid_targets_mean": 1246.5,
"valid_targets_min": 872
},
{
"epoch": 1.4566544566544566,
"grad_norm": 0.6720445528339655,
"learning_rate": 3.8598635158851694e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10842913389205933,
"step": 1790,
"valid_targets_mean": 1903.6,
"valid_targets_min": 1220
},
{
"epoch": 1.4607244607244607,
"grad_norm": 0.7972994996959792,
"learning_rate": 3.858367484479779e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09797993302345276,
"step": 1795,
"valid_targets_mean": 1391.6,
"valid_targets_min": 712
},
{
"epoch": 1.4647944647944648,
"grad_norm": 0.8151552299642496,
"learning_rate": 3.856863803013897e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11069940030574799,
"step": 1800,
"valid_targets_mean": 1295.0,
"valid_targets_min": 605
},
{
"epoch": 1.468864468864469,
"grad_norm": 0.6855785516547465,
"learning_rate": 3.855352477677504e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06866128742694855,
"step": 1805,
"valid_targets_mean": 1414.8,
"valid_targets_min": 746
},
{
"epoch": 1.4729344729344729,
"grad_norm": 0.8055255610517995,
"learning_rate": 3.853833514692044e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0873202309012413,
"step": 1810,
"valid_targets_mean": 1059.4,
"valid_targets_min": 723
},
{
"epoch": 1.477004477004477,
"grad_norm": 0.7866122138481166,
"learning_rate": 3.852306920310401e-05,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11211128532886505,
"step": 1815,
"valid_targets_mean": 1634.2,
"valid_targets_min": 1327
},
{
"epoch": 1.4810744810744811,
"grad_norm": 0.7173011268227322,
"learning_rate": 3.850772700816877e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09077475965023041,
"step": 1820,
"valid_targets_mean": 1412.5,
"valid_targets_min": 902
},
{
"epoch": 1.485144485144485,
"grad_norm": 0.6952841023611934,
"learning_rate": 3.8492308625271596e-05,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09670276939868927,
"step": 1825,
"valid_targets_mean": 1558.8,
"valid_targets_min": 803
},
{
"epoch": 1.4892144892144892,
"grad_norm": 0.7685210240880278,
"learning_rate": 3.8476814117883034e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10378531366586685,
"step": 1830,
"valid_targets_mean": 1441.2,
"valid_targets_min": 1079
},
{
"epoch": 1.4932844932844933,
"grad_norm": 0.7239079288465091,
"learning_rate": 3.846124354978697e-05,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09632142633199692,
"step": 1835,
"valid_targets_mean": 1449.8,
"valid_targets_min": 1263
},
{
"epoch": 1.4973544973544972,
"grad_norm": 0.7850402456186506,
"learning_rate": 3.8445596985080404e-05,
"loss": 0.2141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10480426251888275,
"step": 1840,
"valid_targets_mean": 1487.4,
"valid_targets_min": 844
},
{
"epoch": 1.5014245014245016,
"grad_norm": 0.8068791427285449,
"learning_rate": 3.842987448817319e-05,
"loss": 0.2094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09140418469905853,
"step": 1845,
"valid_targets_mean": 1421.4,
"valid_targets_min": 667
},
{
"epoch": 1.5054945054945055,
"grad_norm": 0.7097429620733522,
"learning_rate": 3.841407612378775e-05,
"loss": 0.2126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12428690493106842,
"step": 1850,
"valid_targets_mean": 1822.6,
"valid_targets_min": 1041
},
{
"epoch": 1.5095645095645096,
"grad_norm": 0.7932172765143252,
"learning_rate": 3.839820195695883e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09613991528749466,
"step": 1855,
"valid_targets_mean": 1327.4,
"valid_targets_min": 777
},
{
"epoch": 1.5136345136345137,
"grad_norm": 0.7320076010626049,
"learning_rate": 3.8382252053033196e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10572035610675812,
"step": 1860,
"valid_targets_mean": 1823.8,
"valid_targets_min": 1283
},
{
"epoch": 1.5177045177045176,
"grad_norm": 0.806858170502788,
"learning_rate": 3.836622647766943e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06952077150344849,
"step": 1865,
"valid_targets_mean": 924.0,
"valid_targets_min": 620
},
{
"epoch": 1.5217745217745218,
"grad_norm": 0.7219548062410487,
"learning_rate": 3.835012529683757e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08829911798238754,
"step": 1870,
"valid_targets_mean": 1480.2,
"valid_targets_min": 656
},
{
"epoch": 1.525844525844526,
"grad_norm": 0.6994940063547743,
"learning_rate": 3.833394857681894e-05,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08126124739646912,
"step": 1875,
"valid_targets_mean": 1415.5,
"valid_targets_min": 697
},
{
"epoch": 1.5299145299145298,
"grad_norm": 0.7327643766970442,
"learning_rate": 3.831769638420577e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1019296646118164,
"step": 1880,
"valid_targets_mean": 1655.8,
"valid_targets_min": 816
},
{
"epoch": 1.533984533984534,
"grad_norm": 0.6800577601183724,
"learning_rate": 3.830136878590104e-05,
"loss": 0.1983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09412302821874619,
"step": 1885,
"valid_targets_mean": 1553.0,
"valid_targets_min": 850
},
{
"epoch": 1.538054538054538,
"grad_norm": 0.7426379902022742,
"learning_rate": 3.8284965849118066e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09913598001003265,
"step": 1890,
"valid_targets_mean": 1353.9,
"valid_targets_min": 747
},
{
"epoch": 1.542124542124542,
"grad_norm": 0.7457989847263609,
"learning_rate": 3.826848764138036e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08886919915676117,
"step": 1895,
"valid_targets_mean": 1420.9,
"valid_targets_min": 933
},
{
"epoch": 1.5461945461945463,
"grad_norm": 0.7559545112406654,
"learning_rate": 3.825193423052127e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09691812098026276,
"step": 1900,
"valid_targets_mean": 1394.9,
"valid_targets_min": 827
},
{
"epoch": 1.5502645502645502,
"grad_norm": 0.6854552164584192,
"learning_rate": 3.823530568468371e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08764408528804779,
"step": 1905,
"valid_targets_mean": 1383.2,
"valid_targets_min": 909
},
{
"epoch": 1.5543345543345544,
"grad_norm": 0.6804870010828482,
"learning_rate": 3.821860207231991e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11076577752828598,
"step": 1910,
"valid_targets_mean": 1682.4,
"valid_targets_min": 1094
},
{
"epoch": 1.5584045584045585,
"grad_norm": 0.8066726711083975,
"learning_rate": 3.82018234621911e-05,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09034565091133118,
"step": 1915,
"valid_targets_mean": 1118.4,
"valid_targets_min": 720
},
{
"epoch": 1.5624745624745624,
"grad_norm": 0.7147210480241867,
"learning_rate": 3.818496992336725e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10571155697107315,
"step": 1920,
"valid_targets_mean": 1538.2,
"valid_targets_min": 610
},
{
"epoch": 1.5665445665445665,
"grad_norm": 0.6741394266281067,
"learning_rate": 3.816804152522678e-05,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10726112127304077,
"step": 1925,
"valid_targets_mean": 1570.1,
"valid_targets_min": 713
},
{
"epoch": 1.5706145706145707,
"grad_norm": 0.6935025181842417,
"learning_rate": 3.815103833745626e-05,
"loss": 0.2066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09748126566410065,
"step": 1930,
"valid_targets_mean": 1537.8,
"valid_targets_min": 874
},
{
"epoch": 1.5746845746845746,
"grad_norm": 0.6821876374487306,
"learning_rate": 3.8133960430050135e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09882050007581711,
"step": 1935,
"valid_targets_mean": 1471.2,
"valid_targets_min": 765
},
{
"epoch": 1.578754578754579,
"grad_norm": 0.6990112986801081,
"learning_rate": 3.811680787331047e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08577939867973328,
"step": 1940,
"valid_targets_mean": 1254.4,
"valid_targets_min": 816
},
{
"epoch": 1.5828245828245828,
"grad_norm": 0.7102883473320752,
"learning_rate": 3.809958073784658e-05,
"loss": 0.2058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0998358279466629,
"step": 1945,
"valid_targets_mean": 1482.9,
"valid_targets_min": 1182
},
{
"epoch": 1.5868945868945867,
"grad_norm": 0.7009814403089336,
"learning_rate": 3.8082279094574815e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11195679008960724,
"step": 1950,
"valid_targets_mean": 1583.2,
"valid_targets_min": 363
},
{
"epoch": 1.590964590964591,
"grad_norm": 0.41631203954390233,
"learning_rate": 3.8064903014718245e-05,
"loss": 0.1322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07122399657964706,
"step": 1955,
"valid_targets_mean": 3710.1,
"valid_targets_min": 3074
},
{
"epoch": 1.595034595034595,
"grad_norm": 0.4600103764733667,
"learning_rate": 3.804745256980634e-05,
"loss": 0.1224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06652016937732697,
"step": 1960,
"valid_targets_mean": 2577.6,
"valid_targets_min": 700
},
{
"epoch": 1.5991045991045991,
"grad_norm": 0.4537614450983102,
"learning_rate": 3.80299278316747e-05,
"loss": 0.1233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05843440815806389,
"step": 1965,
"valid_targets_mean": 3309.8,
"valid_targets_min": 803
},
{
"epoch": 1.6031746031746033,
"grad_norm": 0.43458913842163255,
"learning_rate": 3.801232887246479e-05,
"loss": 0.1138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06071528047323227,
"step": 1970,
"valid_targets_mean": 2484.8,
"valid_targets_min": 920
},
{
"epoch": 1.6072446072446072,
"grad_norm": 0.42621344020743934,
"learning_rate": 3.799465576462357e-05,
"loss": 0.1221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06493829935789108,
"step": 1975,
"valid_targets_mean": 3095.1,
"valid_targets_min": 806
},
{
"epoch": 1.6113146113146113,
"grad_norm": 0.7467123259446526,
"learning_rate": 3.7976908580903246e-05,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10322582721710205,
"step": 1980,
"valid_targets_mean": 1663.1,
"valid_targets_min": 718
},
{
"epoch": 1.6153846153846154,
"grad_norm": 0.41841694093835413,
"learning_rate": 3.7959087394360974e-05,
"loss": 0.1278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0684170350432396,
"step": 1985,
"valid_targets_mean": 3443.2,
"valid_targets_min": 1133
},
{
"epoch": 1.6194546194546193,
"grad_norm": 0.4482119640964086,
"learning_rate": 3.794119227835854e-05,
"loss": 0.1293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05158419907093048,
"step": 1990,
"valid_targets_mean": 1609.9,
"valid_targets_min": 859
},
{
"epoch": 1.6235246235246237,
"grad_norm": 0.2808356049969262,
"learning_rate": 3.792322330656206e-05,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045812997967004776,
"step": 1995,
"valid_targets_mean": 5572.1,
"valid_targets_min": 5150
},
{
"epoch": 1.6275946275946276,
"grad_norm": 0.38378216926736985,
"learning_rate": 3.790518055294168e-05,
"loss": 0.1071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07117560505867004,
"step": 2000,
"valid_targets_mean": 3950.0,
"valid_targets_min": 502
},
{
"epoch": 1.6316646316646317,
"grad_norm": 0.3830231524830745,
"learning_rate": 3.788706409177129e-05,
"loss": 0.1128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06173840910196304,
"step": 2005,
"valid_targets_mean": 3669.2,
"valid_targets_min": 600
},
{
"epoch": 1.6357346357346358,
"grad_norm": 0.35711060786805376,
"learning_rate": 3.7868873997628174e-05,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050001971423625946,
"step": 2010,
"valid_targets_mean": 2980.4,
"valid_targets_min": 518
},
{
"epoch": 1.6398046398046398,
"grad_norm": 0.3974333252134189,
"learning_rate": 3.7850610345392735e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06219826638698578,
"step": 2015,
"valid_targets_mean": 3675.4,
"valid_targets_min": 549
},
{
"epoch": 1.6438746438746439,
"grad_norm": 0.3281743505589197,
"learning_rate": 3.7832273210248214e-05,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045098382979631424,
"step": 2020,
"valid_targets_mean": 4013.2,
"valid_targets_min": 3548
},
{
"epoch": 1.647944647944648,
"grad_norm": 0.5366337338266325,
"learning_rate": 3.7813862667680304e-05,
"loss": 0.1251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061837535351514816,
"step": 2025,
"valid_targets_mean": 2000.5,
"valid_targets_min": 644
},
{
"epoch": 1.652014652014652,
"grad_norm": 0.34924838955717313,
"learning_rate": 3.7795378793476904e-05,
"loss": 0.0976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03679157420992851,
"step": 2030,
"valid_targets_mean": 2904.4,
"valid_targets_min": 720
},
{
"epoch": 1.656084656084656,
"grad_norm": 0.48035620858335015,
"learning_rate": 3.777682166372779e-05,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04888860881328583,
"step": 2035,
"valid_targets_mean": 1487.6,
"valid_targets_min": 516
},
{
"epoch": 1.6601546601546602,
"grad_norm": 0.5576087684474084,
"learning_rate": 3.775819135482429e-05,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07822857797145844,
"step": 2040,
"valid_targets_mean": 2006.0,
"valid_targets_min": 557
},
{
"epoch": 1.664224664224664,
"grad_norm": 0.441534949218794,
"learning_rate": 3.773948794345899e-05,
"loss": 0.1316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07287167012691498,
"step": 2045,
"valid_targets_mean": 3359.2,
"valid_targets_min": 1086
},
{
"epoch": 1.6682946682946684,
"grad_norm": 0.4390733330236822,
"learning_rate": 3.7720711506625384e-05,
"loss": 0.1316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08404476940631866,
"step": 2050,
"valid_targets_mean": 2866.8,
"valid_targets_min": 1008
},
{
"epoch": 1.6723646723646723,
"grad_norm": 0.4736301286588309,
"learning_rate": 3.7701862121617595e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04762580618262291,
"step": 2055,
"valid_targets_mean": 3259.9,
"valid_targets_min": 2702
},
{
"epoch": 1.6764346764346765,
"grad_norm": 0.3397713444353576,
"learning_rate": 3.768293986603003e-05,
"loss": 0.1081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04629997909069061,
"step": 2060,
"valid_targets_mean": 4086.4,
"valid_targets_min": 3798
},
{
"epoch": 1.6805046805046806,
"grad_norm": 0.8340021398967473,
"learning_rate": 3.7663944817757094e-05,
"loss": 0.1331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10405413806438446,
"step": 2065,
"valid_targets_mean": 1020.8,
"valid_targets_min": 598
},
{
"epoch": 1.6845746845746845,
"grad_norm": 0.4169904470975252,
"learning_rate": 3.7644877054992814e-05,
"loss": 0.146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047049522399902344,
"step": 2070,
"valid_targets_mean": 2028.4,
"valid_targets_min": 590
},
{
"epoch": 1.6886446886446886,
"grad_norm": 0.3457500004146195,
"learning_rate": 3.7625736656230576e-05,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06108832731842995,
"step": 2075,
"valid_targets_mean": 4046.9,
"valid_targets_min": 3390
},
{
"epoch": 1.6927146927146928,
"grad_norm": 0.6869412401670636,
"learning_rate": 3.760652370026277e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16195940971374512,
"step": 2080,
"valid_targets_mean": 2247.4,
"valid_targets_min": 984
},
{
"epoch": 1.6967846967846967,
"grad_norm": 0.40632518442102483,
"learning_rate": 3.758723826618045e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0758669525384903,
"step": 2085,
"valid_targets_mean": 3348.9,
"valid_targets_min": 2176
},
{
"epoch": 1.7008547008547008,
"grad_norm": 0.4606205763061986,
"learning_rate": 3.7567880433373066e-05,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060970671474933624,
"step": 2090,
"valid_targets_mean": 2385.1,
"valid_targets_min": 1074
},
{
"epoch": 1.704924704924705,
"grad_norm": 0.45654254366777014,
"learning_rate": 3.754845028152807e-05,
"loss": 0.1317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.062153562903404236,
"step": 2095,
"valid_targets_mean": 3126.2,
"valid_targets_min": 1212
},
{
"epoch": 1.7089947089947088,
"grad_norm": 0.3935119632617659,
"learning_rate": 3.7528947890630635e-05,
"loss": 0.2285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06273317337036133,
"step": 2100,
"valid_targets_mean": 4386.0,
"valid_targets_min": 2258
},
{
"epoch": 1.7130647130647132,
"grad_norm": 0.30725829749200173,
"learning_rate": 3.750937334096331e-05,
"loss": 0.1001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07420308887958527,
"step": 2105,
"valid_targets_mean": 3738.9,
"valid_targets_min": 1466
},
{
"epoch": 1.717134717134717,
"grad_norm": 0.3408574469787128,
"learning_rate": 3.7489726713105673e-05,
"loss": 0.1222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05906776338815689,
"step": 2110,
"valid_targets_mean": 3522.6,
"valid_targets_min": 560
},
{
"epoch": 1.7212047212047212,
"grad_norm": 0.3873420033129566,
"learning_rate": 3.747000808793404e-05,
"loss": 0.1279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06194659322500229,
"step": 2115,
"valid_targets_mean": 3383.1,
"valid_targets_min": 1189
},
{
"epoch": 1.7252747252747254,
"grad_norm": 0.35534762128764597,
"learning_rate": 3.745021754662109e-05,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050105899572372437,
"step": 2120,
"valid_targets_mean": 3610.1,
"valid_targets_min": 2257
},
{
"epoch": 1.7293447293447293,
"grad_norm": 0.35587621922779594,
"learning_rate": 3.7430355170635536e-05,
"loss": 0.1049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040797870606184006,
"step": 2125,
"valid_targets_mean": 3479.8,
"valid_targets_min": 886
},
{
"epoch": 1.7334147334147334,
"grad_norm": 0.4101618167732939,
"learning_rate": 3.7410421041741846e-05,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05459919571876526,
"step": 2130,
"valid_targets_mean": 3346.6,
"valid_targets_min": 2409
},
{
"epoch": 1.7374847374847375,
"grad_norm": 0.3706410137638395,
"learning_rate": 3.7390415241999815e-05,
"loss": 0.1038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049584001302719116,
"step": 2135,
"valid_targets_mean": 3552.0,
"valid_targets_min": 2309
},
{
"epoch": 1.7415547415547414,
"grad_norm": 0.6514439786770229,
"learning_rate": 3.737033785376431e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11145202815532684,
"step": 2140,
"valid_targets_mean": 2149.8,
"valid_targets_min": 645
},
{
"epoch": 1.7456247456247458,
"grad_norm": 0.3388516246206135,
"learning_rate": 3.735018895968487e-05,
"loss": 0.0977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04621146619319916,
"step": 2145,
"valid_targets_mean": 3310.2,
"valid_targets_min": 545
},
{
"epoch": 1.7496947496947497,
"grad_norm": 0.4563091012984944,
"learning_rate": 3.73299686427054e-05,
"loss": 0.1009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05684323236346245,
"step": 2150,
"valid_targets_mean": 2458.4,
"valid_targets_min": 667
},
{
"epoch": 1.7537647537647536,
"grad_norm": 0.329941297300451,
"learning_rate": 3.730967698606383e-05,
"loss": 0.0983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046611517667770386,
"step": 2155,
"valid_targets_mean": 3501.5,
"valid_targets_min": 2353
},
{
"epoch": 1.757834757834758,
"grad_norm": 0.39991464682747385,
"learning_rate": 3.728931407329174e-05,
"loss": 0.1032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07516320049762726,
"step": 2160,
"valid_targets_mean": 3220.2,
"valid_targets_min": 792
},
{
"epoch": 1.7619047619047619,
"grad_norm": 0.33577937245255396,
"learning_rate": 3.7268879988214075e-05,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04279305413365364,
"step": 2165,
"valid_targets_mean": 3818.5,
"valid_targets_min": 3276
},
{
"epoch": 1.765974765974766,
"grad_norm": 0.4325931023841163,
"learning_rate": 3.724837481494874e-05,
"loss": 0.1356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06765176355838776,
"step": 2170,
"valid_targets_mean": 2390.9,
"valid_targets_min": 647
},
{
"epoch": 1.7700447700447701,
"grad_norm": 0.5070623066629864,
"learning_rate": 3.722779863790626e-05,
"loss": 0.1246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06652006506919861,
"step": 2175,
"valid_targets_mean": 1500.6,
"valid_targets_min": 673
},
{
"epoch": 1.774114774114774,
"grad_norm": 0.6537069454458774,
"learning_rate": 3.7207151541789505e-05,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.113385409116745,
"step": 2180,
"valid_targets_mean": 1711.2,
"valid_targets_min": 702
},
{
"epoch": 1.7781847781847782,
"grad_norm": 0.44224511896857577,
"learning_rate": 3.7186433611593225e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07473345100879669,
"step": 2185,
"valid_targets_mean": 3036.1,
"valid_targets_min": 945
},
{
"epoch": 1.7822547822547823,
"grad_norm": 0.48920469501680053,
"learning_rate": 3.716564493260381e-05,
"loss": 0.119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08563308417797089,
"step": 2190,
"valid_targets_mean": 3317.2,
"valid_targets_min": 2265
},
{
"epoch": 1.7863247863247862,
"grad_norm": 0.32615432603009253,
"learning_rate": 3.714478559039887e-05,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058499690145254135,
"step": 2195,
"valid_targets_mean": 3875.2,
"valid_targets_min": 3051
},
{
"epoch": 1.7903947903947905,
"grad_norm": 0.5285568387969577,
"learning_rate": 3.712385567084689e-05,
"loss": 0.1235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08171027898788452,
"step": 2200,
"valid_targets_mean": 2069.8,
"valid_targets_min": 523
},
{
"epoch": 1.7944647944647945,
"grad_norm": 0.3459525440694431,
"learning_rate": 3.710285526010693e-05,
"loss": 0.1107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04602465033531189,
"step": 2205,
"valid_targets_mean": 1640.8,
"valid_targets_min": 468
},
{
"epoch": 1.7985347985347986,
"grad_norm": 0.25004285177963237,
"learning_rate": 3.7081784444628185e-05,
"loss": 0.1158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03536680340766907,
"step": 2210,
"valid_targets_mean": 4435.1,
"valid_targets_min": 885
},
{
"epoch": 1.8026048026048027,
"grad_norm": 0.38886600769121415,
"learning_rate": 3.7060643311149706e-05,
"loss": 0.1023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041570305824279785,
"step": 2215,
"valid_targets_mean": 1889.2,
"valid_targets_min": 546
},
{
"epoch": 1.8066748066748066,
"grad_norm": 0.32987051157703745,
"learning_rate": 3.703943194670001e-05,
"loss": 0.1019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059109874069690704,
"step": 2220,
"valid_targets_mean": 4257.1,
"valid_targets_min": 2414
},
{
"epoch": 1.8107448107448108,
"grad_norm": 0.551577193902464,
"learning_rate": 3.7018150438596696e-05,
"loss": 0.1197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061953105032444,
"step": 2225,
"valid_targets_mean": 1502.4,
"valid_targets_min": 697
},
{
"epoch": 1.8148148148148149,
"grad_norm": 0.43626117102890194,
"learning_rate": 3.6996798874446144e-05,
"loss": 0.1251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05732385441660881,
"step": 2230,
"valid_targets_mean": 3466.0,
"valid_targets_min": 2777
},
{
"epoch": 1.8188848188848188,
"grad_norm": 0.4137126451869474,
"learning_rate": 3.6975377342143105e-05,
"loss": 0.1235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06378593295812607,
"step": 2235,
"valid_targets_mean": 3982.1,
"valid_targets_min": 3061
},
{
"epoch": 1.822954822954823,
"grad_norm": 0.33696208651772863,
"learning_rate": 3.695388592987036e-05,
"loss": 0.1067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05193319916725159,
"step": 2240,
"valid_targets_mean": 2788.0,
"valid_targets_min": 868
},
{
"epoch": 1.827024827024827,
"grad_norm": 0.37878300759015127,
"learning_rate": 3.693232472609837e-05,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04331493750214577,
"step": 2245,
"valid_targets_mean": 2120.6,
"valid_targets_min": 752
},
{
"epoch": 1.831094831094831,
"grad_norm": 0.35149923790855736,
"learning_rate": 3.6910693819584865e-05,
"loss": 0.1236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05358132719993591,
"step": 2250,
"valid_targets_mean": 3477.1,
"valid_targets_min": 1141
},
{
"epoch": 1.8351648351648353,
"grad_norm": 0.31501331438328894,
"learning_rate": 3.688899329937454e-05,
"loss": 0.0938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05189646780490875,
"step": 2255,
"valid_targets_mean": 3888.4,
"valid_targets_min": 3540
},
{
"epoch": 1.8392348392348392,
"grad_norm": 0.3667292332003592,
"learning_rate": 3.6867223254798645e-05,
"loss": 0.1238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04574829339981079,
"step": 2260,
"valid_targets_mean": 3086.8,
"valid_targets_min": 773
},
{
"epoch": 1.8433048433048433,
"grad_norm": 0.3290532742643368,
"learning_rate": 3.6845383775474626e-05,
"loss": 0.1172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03846554830670357,
"step": 2265,
"valid_targets_mean": 3558.6,
"valid_targets_min": 2587
},
{
"epoch": 1.8473748473748475,
"grad_norm": 0.3938162713057422,
"learning_rate": 3.6823474951305766e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05593733489513397,
"step": 2270,
"valid_targets_mean": 2688.9,
"valid_targets_min": 773
},
{
"epoch": 1.8514448514448514,
"grad_norm": 0.4221991891103622,
"learning_rate": 3.6801496872480825e-05,
"loss": 0.117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06380049139261246,
"step": 2275,
"valid_targets_mean": 3734.4,
"valid_targets_min": 3068
},
{
"epoch": 1.8555148555148555,
"grad_norm": 0.608114991462476,
"learning_rate": 3.6779449629473615e-05,
"loss": 0.1291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0737733393907547,
"step": 2280,
"valid_targets_mean": 1816.1,
"valid_targets_min": 893
},
{
"epoch": 1.8595848595848596,
"grad_norm": 0.5129055915940605,
"learning_rate": 3.675733331304271e-05,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05952981114387512,
"step": 2285,
"valid_targets_mean": 1444.4,
"valid_targets_min": 708
},
{
"epoch": 1.8636548636548635,
"grad_norm": 0.4126348530013301,
"learning_rate": 3.6735148014230985e-05,
"loss": 0.1227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04681888595223427,
"step": 2290,
"valid_targets_mean": 1768.8,
"valid_targets_min": 617
},
{
"epoch": 1.8677248677248677,
"grad_norm": 0.4275179875164524,
"learning_rate": 3.671289382436532e-05,
"loss": 0.1124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05094176530838013,
"step": 2295,
"valid_targets_mean": 2634.9,
"valid_targets_min": 720
},
{
"epoch": 1.8717948717948718,
"grad_norm": 0.5049917920987161,
"learning_rate": 3.669057083505617e-05,
"loss": 0.1074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06733274459838867,
"step": 2300,
"valid_targets_mean": 1836.2,
"valid_targets_min": 785
},
{
"epoch": 1.8758648758648757,
"grad_norm": 0.5528905832066613,
"learning_rate": 3.6668179138197205e-05,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10168108344078064,
"step": 2305,
"valid_targets_mean": 2148.2,
"valid_targets_min": 765
},
{
"epoch": 1.87993487993488,
"grad_norm": 0.299832096960279,
"learning_rate": 3.664571882596495e-05,
"loss": 0.1033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033232755959033966,
"step": 2310,
"valid_targets_mean": 3639.2,
"valid_targets_min": 2863
},
{
"epoch": 1.884004884004884,
"grad_norm": 0.36729005263055425,
"learning_rate": 3.662318999081837e-05,
"loss": 0.1037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03816433623433113,
"step": 2315,
"valid_targets_mean": 3033.4,
"valid_targets_min": 555
},
{
"epoch": 1.888074888074888,
"grad_norm": 0.43795223384191606,
"learning_rate": 3.660059272549852e-05,
"loss": 0.1148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06973383575677872,
"step": 2320,
"valid_targets_mean": 2346.6,
"valid_targets_min": 721
},
{
"epoch": 1.8921448921448922,
"grad_norm": 0.33790000025819755,
"learning_rate": 3.657792712302814e-05,
"loss": 0.0941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051636915653944016,
"step": 2325,
"valid_targets_mean": 4902.1,
"valid_targets_min": 3640
},
{
"epoch": 1.8962148962148961,
"grad_norm": 0.3604771168113708,
"learning_rate": 3.655519327671129e-05,
"loss": 0.0961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05189387500286102,
"step": 2330,
"valid_targets_mean": 4536.6,
"valid_targets_min": 2020
},
{
"epoch": 1.9002849002849003,
"grad_norm": 0.33562019525922326,
"learning_rate": 3.6532391280132964e-05,
"loss": 0.1146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03787705674767494,
"step": 2335,
"valid_targets_mean": 3218.6,
"valid_targets_min": 739
},
{
"epoch": 1.9043549043549044,
"grad_norm": 0.3743647264168468,
"learning_rate": 3.650952122715869e-05,
"loss": 0.1353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060260578989982605,
"step": 2340,
"valid_targets_mean": 3774.6,
"valid_targets_min": 2945
},
{
"epoch": 1.9084249084249083,
"grad_norm": 0.37262671797339586,
"learning_rate": 3.648658321193415e-05,
"loss": 0.1104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05858001112937927,
"step": 2345,
"valid_targets_mean": 3045.4,
"valid_targets_min": 704
},
{
"epoch": 1.9124949124949127,
"grad_norm": 0.35884300375055905,
"learning_rate": 3.646357732888482e-05,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04959436506032944,
"step": 2350,
"valid_targets_mean": 2492.8,
"valid_targets_min": 774
},
{
"epoch": 1.9165649165649166,
"grad_norm": 0.3589263199724622,
"learning_rate": 3.644050367271553e-05,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04746074602007866,
"step": 2355,
"valid_targets_mean": 2564.6,
"valid_targets_min": 485
},
{
"epoch": 1.9206349206349205,
"grad_norm": 0.406490304131688,
"learning_rate": 3.641736233841012e-05,
"loss": 0.106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046355560421943665,
"step": 2360,
"valid_targets_mean": 3002.5,
"valid_targets_min": 1048
},
{
"epoch": 1.9247049247049248,
"grad_norm": 0.5534145172199101,
"learning_rate": 3.639415342123101e-05,
"loss": 0.1178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050700727850198746,
"step": 2365,
"valid_targets_mean": 2588.5,
"valid_targets_min": 722
},
{
"epoch": 1.9287749287749287,
"grad_norm": 0.4908901714271384,
"learning_rate": 3.637087701671885e-05,
"loss": 0.1188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06826741248369217,
"step": 2370,
"valid_targets_mean": 1443.8,
"valid_targets_min": 865
},
{
"epoch": 1.9328449328449329,
"grad_norm": 0.4557072327685435,
"learning_rate": 3.63475332206921e-05,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061702802777290344,
"step": 2375,
"valid_targets_mean": 2283.1,
"valid_targets_min": 675
},
{
"epoch": 1.936914936914937,
"grad_norm": 0.41528320209522723,
"learning_rate": 3.6324122129246616e-05,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052136339247226715,
"step": 2380,
"valid_targets_mean": 3202.0,
"valid_targets_min": 782
},
{
"epoch": 1.940984940984941,
"grad_norm": 0.4546869915497293,
"learning_rate": 3.630064383875533e-05,
"loss": 0.1089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05638446286320686,
"step": 2385,
"valid_targets_mean": 2586.9,
"valid_targets_min": 795
},
{
"epoch": 1.945054945054945,
"grad_norm": 0.4016367333178925,
"learning_rate": 3.627709844586774e-05,
"loss": 0.1106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05390872061252594,
"step": 2390,
"valid_targets_mean": 3345.4,
"valid_targets_min": 2017
},
{
"epoch": 1.9491249491249492,
"grad_norm": 0.37713484435403527,
"learning_rate": 3.6253486047509634e-05,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048263922333717346,
"step": 2395,
"valid_targets_mean": 1937.5,
"valid_targets_min": 798
},
{
"epoch": 1.953194953194953,
"grad_norm": 0.3376638144663447,
"learning_rate": 3.622980674088258e-05,
"loss": 0.0975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05167309567332268,
"step": 2400,
"valid_targets_mean": 3302.2,
"valid_targets_min": 860
},
{
"epoch": 1.9572649572649574,
"grad_norm": 0.3884117732632468,
"learning_rate": 3.620606062346361e-05,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05166970193386078,
"step": 2405,
"valid_targets_mean": 3287.2,
"valid_targets_min": 878
},
{
"epoch": 1.9613349613349613,
"grad_norm": 0.31443143791227623,
"learning_rate": 3.618224779300478e-05,
"loss": 0.0968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040656059980392456,
"step": 2410,
"valid_targets_mean": 3800.8,
"valid_targets_min": 2602
},
{
"epoch": 1.9654049654049655,
"grad_norm": 0.5020381670968926,
"learning_rate": 3.6158368347532755e-05,
"loss": 0.1142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06920788437128067,
"step": 2415,
"valid_targets_mean": 2853.9,
"valid_targets_min": 945
},
{
"epoch": 1.9694749694749696,
"grad_norm": 0.4185287229781912,
"learning_rate": 3.613442238534845e-05,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06565561890602112,
"step": 2420,
"valid_targets_mean": 3633.9,
"valid_targets_min": 2059
},
{
"epoch": 1.9735449735449735,
"grad_norm": 0.3315436014809084,
"learning_rate": 3.611041000502659e-05,
"loss": 0.1101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057864412665367126,
"step": 2425,
"valid_targets_mean": 4244.8,
"valid_targets_min": 2529
},
{
"epoch": 1.9776149776149776,
"grad_norm": 0.3194580707254878,
"learning_rate": 3.60863313054153e-05,
"loss": 0.0961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06427641212940216,
"step": 2430,
"valid_targets_mean": 4650.8,
"valid_targets_min": 892
},
{
"epoch": 1.9816849816849818,
"grad_norm": 0.25904177449049903,
"learning_rate": 3.6062186385635734e-05,
"loss": 0.1062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03253565728664398,
"step": 2435,
"valid_targets_mean": 4432.1,
"valid_targets_min": 1657
},
{
"epoch": 1.9857549857549857,
"grad_norm": 0.5544926636783111,
"learning_rate": 3.603797534508162e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13297711312770844,
"step": 2440,
"valid_targets_mean": 2023.0,
"valid_targets_min": 709
},
{
"epoch": 1.9898249898249898,
"grad_norm": 0.3150367876998634,
"learning_rate": 3.6013698283418896e-05,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04680216312408447,
"step": 2445,
"valid_targets_mean": 3241.9,
"valid_targets_min": 527
},
{
"epoch": 1.993894993894994,
"grad_norm": 0.37009261570296975,
"learning_rate": 3.598935530058528e-05,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07674941420555115,
"step": 2450,
"valid_targets_mean": 3313.4,
"valid_targets_min": 2308
},
{
"epoch": 1.9979649979649978,
"grad_norm": 0.31909775388216893,
"learning_rate": 3.5964946496789836e-05,
"loss": 0.0989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05330783128738403,
"step": 2455,
"valid_targets_mean": 3463.5,
"valid_targets_min": 2883
},
{
"epoch": 2.0016280016280015,
"grad_norm": 0.4880867496018015,
"learning_rate": 3.5940471972512604e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10746130347251892,
"step": 2460,
"valid_targets_mean": 8514.0,
"valid_targets_min": 6788
},
{
"epoch": 2.005698005698006,
"grad_norm": 0.4659157360495663,
"learning_rate": 3.591593182850415e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11680585891008377,
"step": 2465,
"valid_targets_mean": 6668.0,
"valid_targets_min": 5933
},
{
"epoch": 2.0097680097680097,
"grad_norm": 0.43232390156358325,
"learning_rate": 3.5891326165785196e-05,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10285025835037231,
"step": 2470,
"valid_targets_mean": 4107.0,
"valid_targets_min": 161
},
{
"epoch": 2.0138380138380136,
"grad_norm": 0.3634051714444297,
"learning_rate": 3.586665508564613e-05,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10061359405517578,
"step": 2475,
"valid_targets_mean": 7946.0,
"valid_targets_min": 5596
},
{
"epoch": 2.017908017908018,
"grad_norm": 0.37783795713600243,
"learning_rate": 3.5841918689646666e-05,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1137465387582779,
"step": 2480,
"valid_targets_mean": 7392.8,
"valid_targets_min": 5629
},
{
"epoch": 2.021978021978022,
"grad_norm": 0.398790604122284,
"learning_rate": 3.581711707961539e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1090719997882843,
"step": 2485,
"valid_targets_mean": 6879.6,
"valid_targets_min": 5113
},
{
"epoch": 2.0260480260480263,
"grad_norm": 0.5235045531846907,
"learning_rate": 3.579225035764934e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11241519451141357,
"step": 2490,
"valid_targets_mean": 6919.5,
"valid_targets_min": 5080
},
{
"epoch": 2.03011803011803,
"grad_norm": 0.4208616593976156,
"learning_rate": 3.576731862611359e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09949975460767746,
"step": 2495,
"valid_targets_mean": 6377.0,
"valid_targets_min": 3939
},
{
"epoch": 2.034188034188034,
"grad_norm": 0.3829013185412194,
"learning_rate": 3.5742321987640826e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10645119845867157,
"step": 2500,
"valid_targets_mean": 6392.2,
"valid_targets_min": 4355
},
{
"epoch": 2.0382580382580384,
"grad_norm": 0.44985938212529025,
"learning_rate": 3.571726054513093e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12094033509492874,
"step": 2505,
"valid_targets_mean": 5196.5,
"valid_targets_min": 137
},
{
"epoch": 2.0423280423280423,
"grad_norm": 0.34320734656442425,
"learning_rate": 3.569213440175057e-05,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09449905157089233,
"step": 2510,
"valid_targets_mean": 7344.4,
"valid_targets_min": 5244
},
{
"epoch": 2.0463980463980462,
"grad_norm": 0.32668719505554467,
"learning_rate": 3.566694366093272e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08982042968273163,
"step": 2515,
"valid_targets_mean": 7921.0,
"valid_targets_min": 5311
},
{
"epoch": 2.0504680504680506,
"grad_norm": 0.3852739489735939,
"learning_rate": 3.564168842637631e-05,
"loss": 0.2145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10812553018331528,
"step": 2520,
"valid_targets_mean": 7931.2,
"valid_targets_min": 6015
},
{
"epoch": 2.0545380545380545,
"grad_norm": 0.3845046248072148,
"learning_rate": 3.561636880204573e-05,
"loss": 0.2036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09657958149909973,
"step": 2525,
"valid_targets_mean": 7640.8,
"valid_targets_min": 5248
},
{
"epoch": 2.0586080586080584,
"grad_norm": 0.37913655017775,
"learning_rate": 3.559098489217048e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10077941417694092,
"step": 2530,
"valid_targets_mean": 7249.6,
"valid_targets_min": 5217
},
{
"epoch": 2.0626780626780628,
"grad_norm": 0.3932696577304994,
"learning_rate": 3.556553680124463e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11539335548877716,
"step": 2535,
"valid_targets_mean": 7619.9,
"valid_targets_min": 5094
},
{
"epoch": 2.0667480667480667,
"grad_norm": 0.4553738196822326,
"learning_rate": 3.554002463402651e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09798746556043625,
"step": 2540,
"valid_targets_mean": 7732.8,
"valid_targets_min": 5842
},
{
"epoch": 2.070818070818071,
"grad_norm": 0.3421874470170016,
"learning_rate": 3.55144484955382e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10603936016559601,
"step": 2545,
"valid_targets_mean": 7952.9,
"valid_targets_min": 5494
},
{
"epoch": 2.074888074888075,
"grad_norm": 0.411703732721423,
"learning_rate": 3.5488808491065115e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11069735139608383,
"step": 2550,
"valid_targets_mean": 8001.0,
"valid_targets_min": 5454
},
{
"epoch": 2.078958078958079,
"grad_norm": 0.4858270959003259,
"learning_rate": 3.546310472615559e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07974497973918915,
"step": 2555,
"valid_targets_mean": 2985.1,
"valid_targets_min": 1896
},
{
"epoch": 2.083028083028083,
"grad_norm": 0.36276165908540825,
"learning_rate": 3.5437337306620426e-05,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0890931487083435,
"step": 2560,
"valid_targets_mean": 6714.6,
"valid_targets_min": 4917
},
{
"epoch": 2.087098087098087,
"grad_norm": 0.38710060664879364,
"learning_rate": 3.5411506338532467e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11066673696041107,
"step": 2565,
"valid_targets_mean": 7595.2,
"valid_targets_min": 5488
},
{
"epoch": 2.091168091168091,
"grad_norm": 0.42287295340468783,
"learning_rate": 3.538561192822616e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11034491658210754,
"step": 2570,
"valid_targets_mean": 7046.1,
"valid_targets_min": 5579
},
{
"epoch": 2.0952380952380953,
"grad_norm": 0.39997010448045195,
"learning_rate": 3.535965418229709e-05,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10264366120100021,
"step": 2575,
"valid_targets_mean": 7108.0,
"valid_targets_min": 4963
},
{
"epoch": 2.0993080993080993,
"grad_norm": 0.389640401517337,
"learning_rate": 3.53336332076016e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10438866168260574,
"step": 2580,
"valid_targets_mean": 6810.1,
"valid_targets_min": 5666
},
{
"epoch": 2.1033781033781036,
"grad_norm": 0.36942338263571345,
"learning_rate": 3.530754911125631e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09709086269140244,
"step": 2585,
"valid_targets_mean": 8068.5,
"valid_targets_min": 5524
},
{
"epoch": 2.1074481074481075,
"grad_norm": 0.4068615598584502,
"learning_rate": 3.528140200063766e-05,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08543336391448975,
"step": 2590,
"valid_targets_mean": 6553.8,
"valid_targets_min": 3621
},
{
"epoch": 2.1115181115181114,
"grad_norm": 0.363276338830108,
"learning_rate": 3.525519198338152e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09692707657814026,
"step": 2595,
"valid_targets_mean": 6762.5,
"valid_targets_min": 4968
},
{
"epoch": 2.1155881155881158,
"grad_norm": 0.40355801888377707,
"learning_rate": 3.522891916738269e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09964744746685028,
"step": 2600,
"valid_targets_mean": 6143.9,
"valid_targets_min": 4917
},
{
"epoch": 2.1196581196581197,
"grad_norm": 0.5117847968390805,
"learning_rate": 3.520258366079451e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14205092191696167,
"step": 2605,
"valid_targets_mean": 4583.8,
"valid_targets_min": 215
},
{
"epoch": 2.1237281237281236,
"grad_norm": 0.3623495414988248,
"learning_rate": 3.5176185572028396e-05,
"loss": 0.2115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10662650316953659,
"step": 2610,
"valid_targets_mean": 7317.1,
"valid_targets_min": 4948
},
{
"epoch": 2.127798127798128,
"grad_norm": 0.4038325996304427,
"learning_rate": 3.514972500975334e-05,
"loss": 0.2245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10691466927528381,
"step": 2615,
"valid_targets_mean": 6437.6,
"valid_targets_min": 4510
},
{
"epoch": 2.131868131868132,
"grad_norm": 0.41453320525991616,
"learning_rate": 3.512320208289556e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11678023636341095,
"step": 2620,
"valid_targets_mean": 7707.9,
"valid_targets_min": 5796
},
{
"epoch": 2.1359381359381358,
"grad_norm": 0.3827950421697951,
"learning_rate": 3.509661690063796e-05,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10019416362047195,
"step": 2625,
"valid_targets_mean": 7900.9,
"valid_targets_min": 5643
},
{
"epoch": 2.14000814000814,
"grad_norm": 0.4162389900061376,
"learning_rate": 3.506996957241975e-05,
"loss": 0.2082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11353873461484909,
"step": 2630,
"valid_targets_mean": 7627.2,
"valid_targets_min": 5742
},
{
"epoch": 2.144078144078144,
"grad_norm": 0.37061577197439505,
"learning_rate": 3.5043260207935964e-05,
"loss": 0.2116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12082710862159729,
"step": 2635,
"valid_targets_mean": 8725.6,
"valid_targets_min": 5141
},
{
"epoch": 2.148148148148148,
"grad_norm": 0.3989344474846749,
"learning_rate": 3.5016488917137005e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11526183038949966,
"step": 2640,
"valid_targets_mean": 6967.8,
"valid_targets_min": 6088
},
{
"epoch": 2.1522181522181523,
"grad_norm": 0.3765813295326696,
"learning_rate": 3.4989655810228185e-05,
"loss": 0.2105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09672106802463531,
"step": 2645,
"valid_targets_mean": 7140.1,
"valid_targets_min": 4834
},
{
"epoch": 2.156288156288156,
"grad_norm": 0.4244375123230793,
"learning_rate": 3.496276099766932e-05,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09745915234088898,
"step": 2650,
"valid_targets_mean": 6706.9,
"valid_targets_min": 5108
},
{
"epoch": 2.1603581603581605,
"grad_norm": 0.41712309629614364,
"learning_rate": 3.493580459017419e-05,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1050487756729126,
"step": 2655,
"valid_targets_mean": 5931.4,
"valid_targets_min": 4708
},
{
"epoch": 2.1644281644281644,
"grad_norm": 0.36084098571878304,
"learning_rate": 3.4908786698710196e-05,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09638667106628418,
"step": 2660,
"valid_targets_mean": 7145.6,
"valid_targets_min": 5280
},
{
"epoch": 2.1684981684981683,
"grad_norm": 0.660596763158056,
"learning_rate": 3.488170743449779e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06803116202354431,
"step": 2665,
"valid_targets_mean": 1554.9,
"valid_targets_min": 592
},
{
"epoch": 2.1725681725681727,
"grad_norm": 0.4482747012803121,
"learning_rate": 3.4854566909010074e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11789162456989288,
"step": 2670,
"valid_targets_mean": 7069.5,
"valid_targets_min": 4765
},
{
"epoch": 2.1766381766381766,
"grad_norm": 0.3901951315778572,
"learning_rate": 3.482736523397237e-05,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10189478099346161,
"step": 2675,
"valid_targets_mean": 6193.4,
"valid_targets_min": 5587
},
{
"epoch": 2.1807081807081805,
"grad_norm": 0.42745988843150207,
"learning_rate": 3.4800102521361686e-05,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10757580399513245,
"step": 2680,
"valid_targets_mean": 6612.2,
"valid_targets_min": 4894
},
{
"epoch": 2.184778184778185,
"grad_norm": 0.36920716366061657,
"learning_rate": 3.477277888340631e-05,
"loss": 0.1988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09517497569322586,
"step": 2685,
"valid_targets_mean": 6605.9,
"valid_targets_min": 3795
},
{
"epoch": 2.1888481888481888,
"grad_norm": 0.3841241265624308,
"learning_rate": 3.474539443258534e-05,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10367844998836517,
"step": 2690,
"valid_targets_mean": 7186.8,
"valid_targets_min": 4890
},
{
"epoch": 2.192918192918193,
"grad_norm": 0.412689694061922,
"learning_rate": 3.47179492816282e-05,
"loss": 0.2084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10491199791431427,
"step": 2695,
"valid_targets_mean": 6544.4,
"valid_targets_min": 4615
},
{
"epoch": 2.196988196988197,
"grad_norm": 0.4079072132791562,
"learning_rate": 3.4690443543514195e-05,
"loss": 0.2094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1100861206650734,
"step": 2700,
"valid_targets_mean": 6339.2,
"valid_targets_min": 4798
},
{
"epoch": 2.201058201058201,
"grad_norm": 0.49329598417369225,
"learning_rate": 3.466287733147204e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11788356304168701,
"step": 2705,
"valid_targets_mean": 4558.8,
"valid_targets_min": 148
},
{
"epoch": 2.2051282051282053,
"grad_norm": 0.4145578788267481,
"learning_rate": 3.463525075897939e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11438199877738953,
"step": 2710,
"valid_targets_mean": 6807.9,
"valid_targets_min": 5164
},
{
"epoch": 2.209198209198209,
"grad_norm": 0.4801367983090269,
"learning_rate": 3.4607563939762376e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10205637663602829,
"step": 2715,
"valid_targets_mean": 7011.8,
"valid_targets_min": 4974
},
{
"epoch": 2.213268213268213,
"grad_norm": 0.3925286843177837,
"learning_rate": 3.4579816987795153e-05,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09270621836185455,
"step": 2720,
"valid_targets_mean": 5794.2,
"valid_targets_min": 4809
},
{
"epoch": 2.2173382173382175,
"grad_norm": 0.407243764629195,
"learning_rate": 3.45520100172994e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09255869686603546,
"step": 2725,
"valid_targets_mean": 6401.8,
"valid_targets_min": 4842
},
{
"epoch": 2.2214082214082214,
"grad_norm": 0.42364061860080554,
"learning_rate": 3.452414314274386e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10335355252027512,
"step": 2730,
"valid_targets_mean": 6182.1,
"valid_targets_min": 5116
},
{
"epoch": 2.2254782254782253,
"grad_norm": 0.3622471152141575,
"learning_rate": 3.449621647884389e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09193432331085205,
"step": 2735,
"valid_targets_mean": 6165.1,
"valid_targets_min": 5764
},
{
"epoch": 2.2295482295482296,
"grad_norm": 0.7288165001567957,
"learning_rate": 3.446823014056096e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08235251158475876,
"step": 2740,
"valid_targets_mean": 1428.2,
"valid_targets_min": 1062
},
{
"epoch": 2.2336182336182335,
"grad_norm": 0.7611801465102082,
"learning_rate": 3.444018424310221e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0987827330827713,
"step": 2745,
"valid_targets_mean": 1663.0,
"valid_targets_min": 960
},
{
"epoch": 2.237688237688238,
"grad_norm": 0.7650679543370236,
"learning_rate": 3.441207890191993e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09653256833553314,
"step": 2750,
"valid_targets_mean": 1476.5,
"valid_targets_min": 933
},
{
"epoch": 2.241758241758242,
"grad_norm": 0.83957302169369,
"learning_rate": 3.438391423271115e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0952417328953743,
"step": 2755,
"valid_targets_mean": 1478.1,
"valid_targets_min": 881
},
{
"epoch": 2.2458282458282457,
"grad_norm": 0.8264299057033202,
"learning_rate": 3.435569035141708e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11602550745010376,
"step": 2760,
"valid_targets_mean": 1640.6,
"valid_targets_min": 869
},
{
"epoch": 2.24989824989825,
"grad_norm": 0.8302853801654866,
"learning_rate": 3.4327407374222726e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10423608124256134,
"step": 2765,
"valid_targets_mean": 1709.0,
"valid_targets_min": 1090
},
{
"epoch": 2.253968253968254,
"grad_norm": 0.7943422274719701,
"learning_rate": 3.429906541755633e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07585322856903076,
"step": 2770,
"valid_targets_mean": 1157.9,
"valid_targets_min": 761
},
{
"epoch": 2.258038258038258,
"grad_norm": 0.7565321550178822,
"learning_rate": 3.427066459808896e-05,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09391198307275772,
"step": 2775,
"valid_targets_mean": 1553.6,
"valid_targets_min": 1241
},
{
"epoch": 2.262108262108262,
"grad_norm": 0.7572888191925212,
"learning_rate": 3.4242205032733964e-05,
"loss": 0.1866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.089296355843544,
"step": 2780,
"valid_targets_mean": 1538.1,
"valid_targets_min": 733
},
{
"epoch": 2.266178266178266,
"grad_norm": 0.7064148997241197,
"learning_rate": 3.421368683864653e-05,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05855751782655716,
"step": 2785,
"valid_targets_mean": 1250.6,
"valid_targets_min": 835
},
{
"epoch": 2.2702482702482705,
"grad_norm": 0.8701439644199427,
"learning_rate": 3.41851101332232e-05,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1104547530412674,
"step": 2790,
"valid_targets_mean": 1596.2,
"valid_targets_min": 1046
},
{
"epoch": 2.2743182743182744,
"grad_norm": 0.7800184045885545,
"learning_rate": 3.4156475034101366e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09086226671934128,
"step": 2795,
"valid_targets_mean": 1646.5,
"valid_targets_min": 797
},
{
"epoch": 2.2783882783882783,
"grad_norm": 0.7543167696467623,
"learning_rate": 3.4127781659158834e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09387262165546417,
"step": 2800,
"valid_targets_mean": 1448.9,
"valid_targets_min": 570
},
{
"epoch": 2.2824582824582826,
"grad_norm": 0.7308404855311503,
"learning_rate": 3.409903012651327e-05,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06849798560142517,
"step": 2805,
"valid_targets_mean": 1164.1,
"valid_targets_min": 548
},
{
"epoch": 2.2865282865282865,
"grad_norm": 0.8596378098769865,
"learning_rate": 3.407022055452176e-05,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09337285161018372,
"step": 2810,
"valid_targets_mean": 1338.0,
"valid_targets_min": 682
},
{
"epoch": 2.2905982905982905,
"grad_norm": 0.7766417971092897,
"learning_rate": 3.404135306178032e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09825626015663147,
"step": 2815,
"valid_targets_mean": 1632.8,
"valid_targets_min": 896
},
{
"epoch": 2.294668294668295,
"grad_norm": 0.7789615600939394,
"learning_rate": 3.401242776712339e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12328001856803894,
"step": 2820,
"valid_targets_mean": 1806.5,
"valid_targets_min": 597
},
{
"epoch": 2.2987382987382987,
"grad_norm": 0.7920477301948577,
"learning_rate": 3.3983444789623356e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08308230340480804,
"step": 2825,
"valid_targets_mean": 1289.9,
"valid_targets_min": 706
},
{
"epoch": 2.3028083028083026,
"grad_norm": 0.8975491925387518,
"learning_rate": 3.395440424859007e-05,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06022972613573074,
"step": 2830,
"valid_targets_mean": 1354.1,
"valid_targets_min": 754
},
{
"epoch": 2.306878306878307,
"grad_norm": 0.7130180704385317,
"learning_rate": 3.3925306263570316e-05,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08599118888378143,
"step": 2835,
"valid_targets_mean": 1461.9,
"valid_targets_min": 819
},
{
"epoch": 2.310948310948311,
"grad_norm": 0.7039318125811921,
"learning_rate": 3.389615095434739e-05,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07211598753929138,
"step": 2840,
"valid_targets_mean": 1225.5,
"valid_targets_min": 684
},
{
"epoch": 2.315018315018315,
"grad_norm": 0.9104668810680625,
"learning_rate": 3.386693844094055e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09691354632377625,
"step": 2845,
"valid_targets_mean": 1282.2,
"valid_targets_min": 711
},
{
"epoch": 2.319088319088319,
"grad_norm": 0.7159321952742587,
"learning_rate": 3.3837668843604506e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09997346997261047,
"step": 2850,
"valid_targets_mean": 1634.8,
"valid_targets_min": 1190
},
{
"epoch": 2.323158323158323,
"grad_norm": 0.7393893216811349,
"learning_rate": 3.380834228282901e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09477157890796661,
"step": 2855,
"valid_targets_mean": 1615.9,
"valid_targets_min": 774
},
{
"epoch": 2.3272283272283274,
"grad_norm": 0.6968353858472797,
"learning_rate": 3.377895887933828e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09568726271390915,
"step": 2860,
"valid_targets_mean": 1848.4,
"valid_targets_min": 734
},
{
"epoch": 2.3312983312983313,
"grad_norm": 0.792449089844968,
"learning_rate": 3.374951875409052e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09505010396242142,
"step": 2865,
"valid_targets_mean": 1570.6,
"valid_targets_min": 1011
},
{
"epoch": 2.335368335368335,
"grad_norm": 0.8817699677604942,
"learning_rate": 3.372002202827744e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10640811175107956,
"step": 2870,
"valid_targets_mean": 1697.0,
"valid_targets_min": 803
},
{
"epoch": 2.3394383394383396,
"grad_norm": 0.8000585484054449,
"learning_rate": 3.369046882332376e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0811472162604332,
"step": 2875,
"valid_targets_mean": 1307.1,
"valid_targets_min": 782
},
{
"epoch": 2.3435083435083435,
"grad_norm": 0.7232841587277343,
"learning_rate": 3.36608592608867e-05,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09704796224832535,
"step": 2880,
"valid_targets_mean": 1596.6,
"valid_targets_min": 646
},
{
"epoch": 2.347578347578348,
"grad_norm": 0.75091103368943,
"learning_rate": 3.363119346285546e-05,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1288718581199646,
"step": 2885,
"valid_targets_mean": 1817.5,
"valid_targets_min": 922
},
{
"epoch": 2.3516483516483517,
"grad_norm": 0.7628714260858689,
"learning_rate": 3.360147155135074e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10485200583934784,
"step": 2890,
"valid_targets_mean": 1822.2,
"valid_targets_min": 796
},
{
"epoch": 2.3557183557183556,
"grad_norm": 0.7313328666663071,
"learning_rate": 3.3571693648724255e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09335388988256454,
"step": 2895,
"valid_targets_mean": 1542.4,
"valid_targets_min": 903
},
{
"epoch": 2.35978835978836,
"grad_norm": 0.7976060703436042,
"learning_rate": 3.354185987755818e-05,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10187899321317673,
"step": 2900,
"valid_targets_mean": 1459.5,
"valid_targets_min": 780
},
{
"epoch": 2.363858363858364,
"grad_norm": 0.7155507200782179,
"learning_rate": 3.35119703606647e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09475696831941605,
"step": 2905,
"valid_targets_mean": 1581.1,
"valid_targets_min": 783
},
{
"epoch": 2.367928367928368,
"grad_norm": 0.7284814264168356,
"learning_rate": 3.3482025221085476e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07198642194271088,
"step": 2910,
"valid_targets_mean": 1342.1,
"valid_targets_min": 662
},
{
"epoch": 2.371998371998372,
"grad_norm": 0.7533633677117174,
"learning_rate": 3.345202458209112e-05,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08188924193382263,
"step": 2915,
"valid_targets_mean": 1269.1,
"valid_targets_min": 724
},
{
"epoch": 2.376068376068376,
"grad_norm": 0.7522234550738248,
"learning_rate": 3.342196856718074e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0987510234117508,
"step": 2920,
"valid_targets_mean": 1510.1,
"valid_targets_min": 966
},
{
"epoch": 2.38013838013838,
"grad_norm": 0.7796084834753764,
"learning_rate": 3.339185730008138e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07946356385946274,
"step": 2925,
"valid_targets_mean": 1327.8,
"valid_targets_min": 773
},
{
"epoch": 2.3842083842083843,
"grad_norm": 1.1234420570664228,
"learning_rate": 3.336169090474756e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07645580172538757,
"step": 2930,
"valid_targets_mean": 1353.2,
"valid_targets_min": 807
},
{
"epoch": 2.3882783882783882,
"grad_norm": 0.8228399599394453,
"learning_rate": 3.333146950536069e-05,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06878844648599625,
"step": 2935,
"valid_targets_mean": 1142.5,
"valid_targets_min": 782
},
{
"epoch": 2.392348392348392,
"grad_norm": 0.761793565454502,
"learning_rate": 3.330119322632866e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10029375553131104,
"step": 2940,
"valid_targets_mean": 1849.9,
"valid_targets_min": 634
},
{
"epoch": 2.3964183964183965,
"grad_norm": 0.7748556030785365,
"learning_rate": 3.327086219228525e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09164921939373016,
"step": 2945,
"valid_targets_mean": 1599.6,
"valid_targets_min": 573
},
{
"epoch": 2.4004884004884004,
"grad_norm": 0.6823141885908128,
"learning_rate": 3.324047652808963e-05,
"loss": 0.1843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10002493113279343,
"step": 2950,
"valid_targets_mean": 1994.9,
"valid_targets_min": 1102
},
{
"epoch": 2.4045584045584047,
"grad_norm": 0.7203959180089063,
"learning_rate": 3.321003635882588e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06791776418685913,
"step": 2955,
"valid_targets_mean": 1239.2,
"valid_targets_min": 841
},
{
"epoch": 2.4086284086284087,
"grad_norm": 0.8522458805730017,
"learning_rate": 3.3179541809802436e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0885857418179512,
"step": 2960,
"valid_targets_mean": 1467.5,
"valid_targets_min": 956
},
{
"epoch": 2.4126984126984126,
"grad_norm": 0.8485280697833679,
"learning_rate": 3.31489930065516e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09528080374002457,
"step": 2965,
"valid_targets_mean": 1300.9,
"valid_targets_min": 857
},
{
"epoch": 2.416768416768417,
"grad_norm": 0.702328495769866,
"learning_rate": 3.311839007482902e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09654178470373154,
"step": 2970,
"valid_targets_mean": 1389.8,
"valid_targets_min": 808
},
{
"epoch": 2.420838420838421,
"grad_norm": 0.7498418061623674,
"learning_rate": 3.308773314061315e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0779038816690445,
"step": 2975,
"valid_targets_mean": 1303.8,
"valid_targets_min": 677
},
{
"epoch": 2.4249084249084247,
"grad_norm": 0.7339750048913246,
"learning_rate": 3.3057022330104764e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0759783387184143,
"step": 2980,
"valid_targets_mean": 1220.1,
"valid_targets_min": 727
},
{
"epoch": 2.428978428978429,
"grad_norm": 0.7678673826329332,
"learning_rate": 3.30262577697264e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07477933913469315,
"step": 2985,
"valid_targets_mean": 1262.0,
"valid_targets_min": 726
},
{
"epoch": 2.433048433048433,
"grad_norm": 0.7882443666752398,
"learning_rate": 3.299543958612188e-05,
"loss": 0.1851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10648937523365021,
"step": 2990,
"valid_targets_mean": 1615.0,
"valid_targets_min": 669
},
{
"epoch": 2.4371184371184373,
"grad_norm": 0.7375257054384906,
"learning_rate": 3.2964567906155775e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10215851664543152,
"step": 2995,
"valid_targets_mean": 1806.5,
"valid_targets_min": 792
},
{
"epoch": 2.4411884411884412,
"grad_norm": 0.7644653496961722,
"learning_rate": 3.293364285691284e-05,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09152808785438538,
"step": 3000,
"valid_targets_mean": 1627.6,
"valid_targets_min": 736
},
{
"epoch": 2.445258445258445,
"grad_norm": 0.836057897371144,
"learning_rate": 3.290266456569756e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12586501240730286,
"step": 3005,
"valid_targets_mean": 1822.9,
"valid_targets_min": 694
},
{
"epoch": 2.4493284493284495,
"grad_norm": 0.7684573774704392,
"learning_rate": 3.2871633160033596e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11305080354213715,
"step": 3010,
"valid_targets_mean": 1848.9,
"valid_targets_min": 1437
},
{
"epoch": 2.4533984533984534,
"grad_norm": 0.7722426718287829,
"learning_rate": 3.2840548767663226e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11125504225492477,
"step": 3015,
"valid_targets_mean": 1852.4,
"valid_targets_min": 809
},
{
"epoch": 2.4574684574684573,
"grad_norm": 0.8693277147754886,
"learning_rate": 3.2809411516546876e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0825982391834259,
"step": 3020,
"valid_targets_mean": 1375.5,
"valid_targets_min": 790
},
{
"epoch": 2.4615384615384617,
"grad_norm": 0.8569411244780402,
"learning_rate": 3.2778221534862554e-05,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08256229013204575,
"step": 3025,
"valid_targets_mean": 1338.8,
"valid_targets_min": 750
},
{
"epoch": 2.4656084656084656,
"grad_norm": 0.8496633562930437,
"learning_rate": 3.274697895100536e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11016149818897247,
"step": 3030,
"valid_targets_mean": 1778.8,
"valid_targets_min": 826
},
{
"epoch": 2.4696784696784695,
"grad_norm": 0.7550200846250567,
"learning_rate": 3.2715683893586904e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08121539652347565,
"step": 3035,
"valid_targets_mean": 1600.8,
"valid_targets_min": 907
},
{
"epoch": 2.473748473748474,
"grad_norm": 0.7407812428035063,
"learning_rate": 3.2684336491434814e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09471592307090759,
"step": 3040,
"valid_targets_mean": 1474.5,
"valid_targets_min": 1093
},
{
"epoch": 2.4778184778184777,
"grad_norm": 1.167858594983234,
"learning_rate": 3.2652936873592206e-05,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09139646589756012,
"step": 3045,
"valid_targets_mean": 1577.2,
"valid_targets_min": 1119
},
{
"epoch": 2.4818884818884817,
"grad_norm": 0.7675583595322624,
"learning_rate": 3.262148516931714e-05,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10131756961345673,
"step": 3050,
"valid_targets_mean": 1512.1,
"valid_targets_min": 700
},
{
"epoch": 2.485958485958486,
"grad_norm": 0.7516413523459232,
"learning_rate": 3.25899815080821e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07350552827119827,
"step": 3055,
"valid_targets_mean": 1288.2,
"valid_targets_min": 810
},
{
"epoch": 2.49002849002849,
"grad_norm": 0.9663636034775042,
"learning_rate": 3.2558426019573435e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0857287123799324,
"step": 3060,
"valid_targets_mean": 1328.9,
"valid_targets_min": 635
},
{
"epoch": 2.4940984940984943,
"grad_norm": 0.7525509366960841,
"learning_rate": 3.2526818833690855e-05,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10586247593164444,
"step": 3065,
"valid_targets_mean": 1542.5,
"valid_targets_min": 673
},
{
"epoch": 2.498168498168498,
"grad_norm": 0.8552319935455616,
"learning_rate": 3.2495160080546895e-05,
"loss": 0.1866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09937754273414612,
"step": 3070,
"valid_targets_mean": 1215.6,
"valid_targets_min": 641
},
{
"epoch": 2.502238502238502,
"grad_norm": 0.7825010890917209,
"learning_rate": 3.246344989046635e-05,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07913076877593994,
"step": 3075,
"valid_targets_mean": 1222.6,
"valid_targets_min": 701
},
{
"epoch": 2.5063085063085064,
"grad_norm": 0.7499645512602379,
"learning_rate": 3.243168839398576e-05,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09814945608377457,
"step": 3080,
"valid_targets_mean": 1850.6,
"valid_targets_min": 1202
},
{
"epoch": 2.5103785103785103,
"grad_norm": 0.7240473408886264,
"learning_rate": 3.239987572185288e-05,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06967031210660934,
"step": 3085,
"valid_targets_mean": 1265.5,
"valid_targets_min": 657
},
{
"epoch": 2.5144485144485147,
"grad_norm": 0.7723805357606571,
"learning_rate": 3.2368012005026136e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08349703252315521,
"step": 3090,
"valid_targets_mean": 1388.0,
"valid_targets_min": 672
},
{
"epoch": 2.5185185185185186,
"grad_norm": 0.740778910182572,
"learning_rate": 3.233609737467407e-05,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10719085484743118,
"step": 3095,
"valid_targets_mean": 1813.6,
"valid_targets_min": 1019
},
{
"epoch": 2.5225885225885225,
"grad_norm": 0.7925251844992214,
"learning_rate": 3.2304131962174804e-05,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0703994482755661,
"step": 3100,
"valid_targets_mean": 1114.6,
"valid_targets_min": 732
},
{
"epoch": 2.526658526658527,
"grad_norm": 0.7739162778424586,
"learning_rate": 3.227211589911554e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06456971168518066,
"step": 3105,
"valid_targets_mean": 1194.5,
"valid_targets_min": 634
},
{
"epoch": 2.5307285307285308,
"grad_norm": 0.6811693756020172,
"learning_rate": 3.224004931729195e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0884883850812912,
"step": 3110,
"valid_targets_mean": 1756.5,
"valid_targets_min": 905
},
{
"epoch": 2.5347985347985347,
"grad_norm": 1.2605982496459476,
"learning_rate": 3.220793234870769e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10120239853858948,
"step": 3115,
"valid_targets_mean": 1554.9,
"valid_targets_min": 596
},
{
"epoch": 2.538868538868539,
"grad_norm": 0.7456047283707952,
"learning_rate": 3.217576512557383e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07132766395807266,
"step": 3120,
"valid_targets_mean": 1214.6,
"valid_targets_min": 687
},
{
"epoch": 2.542938542938543,
"grad_norm": 0.7668765276856079,
"learning_rate": 3.214354778030831e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10113206505775452,
"step": 3125,
"valid_targets_mean": 1955.1,
"valid_targets_min": 1199
},
{
"epoch": 2.547008547008547,
"grad_norm": 0.6688254932482489,
"learning_rate": 3.211128044553542e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08862347900867462,
"step": 3130,
"valid_targets_mean": 1758.6,
"valid_targets_min": 1214
},
{
"epoch": 2.551078551078551,
"grad_norm": 0.7105824934530232,
"learning_rate": 3.2078963254085186e-05,
"loss": 0.1713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09190790355205536,
"step": 3135,
"valid_targets_mean": 1711.5,
"valid_targets_min": 1122
},
{
"epoch": 2.555148555148555,
"grad_norm": 1.574075103571208,
"learning_rate": 3.2046596338992934e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08651512861251831,
"step": 3140,
"valid_targets_mean": 1489.6,
"valid_targets_min": 850
},
{
"epoch": 2.559218559218559,
"grad_norm": 0.7171578485312335,
"learning_rate": 3.201417983349865e-05,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07850717753171921,
"step": 3145,
"valid_targets_mean": 1572.4,
"valid_targets_min": 1318
},
{
"epoch": 2.5632885632885634,
"grad_norm": 0.784020145965083,
"learning_rate": 3.198171387104645e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09676879644393921,
"step": 3150,
"valid_targets_mean": 1500.0,
"valid_targets_min": 1043
},
{
"epoch": 2.5673585673585673,
"grad_norm": 0.7023031187317561,
"learning_rate": 3.194919858528405e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10829615592956543,
"step": 3155,
"valid_targets_mean": 1774.9,
"valid_targets_min": 920
},
{
"epoch": 2.571428571428571,
"grad_norm": 0.7266495375892049,
"learning_rate": 3.191663411006222e-05,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09090869128704071,
"step": 3160,
"valid_targets_mean": 1547.1,
"valid_targets_min": 847
},
{
"epoch": 2.5754985754985755,
"grad_norm": 0.7082754020615566,
"learning_rate": 3.1884020579434216e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09622791409492493,
"step": 3165,
"valid_targets_mean": 1769.4,
"valid_targets_min": 738
},
{
"epoch": 2.5795685795685794,
"grad_norm": 0.7671758979055356,
"learning_rate": 3.1851358127655214e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09749025106430054,
"step": 3170,
"valid_targets_mean": 1540.1,
"valid_targets_min": 594
},
{
"epoch": 2.583638583638584,
"grad_norm": 0.646884294048327,
"learning_rate": 3.1818646889181815e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09275157749652863,
"step": 3175,
"valid_targets_mean": 2228.6,
"valid_targets_min": 1393
},
{
"epoch": 2.5877085877085877,
"grad_norm": 0.43091544980003527,
"learning_rate": 3.1785886998671406e-05,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07351458072662354,
"step": 3180,
"valid_targets_mean": 3981.9,
"valid_targets_min": 3545
},
{
"epoch": 2.591778591778592,
"grad_norm": 0.40608611395729444,
"learning_rate": 3.1753078590981697e-05,
"loss": 0.1094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053135018795728683,
"step": 3185,
"valid_targets_mean": 2837.8,
"valid_targets_min": 1024
},
{
"epoch": 2.595848595848596,
"grad_norm": 0.2970617855486435,
"learning_rate": 3.1720221801170076e-05,
"loss": 0.0971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029508689418435097,
"step": 3190,
"valid_targets_mean": 3453.5,
"valid_targets_min": 3026
},
{
"epoch": 2.5999185999186,
"grad_norm": 0.4040679062651357,
"learning_rate": 3.1687316764493145e-05,
"loss": 0.1199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06386222690343857,
"step": 3195,
"valid_targets_mean": 3272.8,
"valid_targets_min": 2213
},
{
"epoch": 2.603988603988604,
"grad_norm": 0.42140297889686756,
"learning_rate": 3.165436361640608e-05,
"loss": 0.0958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06314370036125183,
"step": 3200,
"valid_targets_mean": 3111.5,
"valid_targets_min": 1134
},
{
"epoch": 2.608058608058608,
"grad_norm": 0.4318510588456392,
"learning_rate": 3.162136249256214e-05,
"loss": 0.1067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06179654225707054,
"step": 3205,
"valid_targets_mean": 2179.2,
"valid_targets_min": 663
},
{
"epoch": 2.612128612128612,
"grad_norm": 0.6151866793044011,
"learning_rate": 3.158831352881204e-05,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06750689446926117,
"step": 3210,
"valid_targets_mean": 2128.4,
"valid_targets_min": 535
},
{
"epoch": 2.6161986161986164,
"grad_norm": 0.4023184284236594,
"learning_rate": 3.1555216861203466e-05,
"loss": 0.1023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04353209584951401,
"step": 3215,
"valid_targets_mean": 1964.0,
"valid_targets_min": 811
},
{
"epoch": 2.6202686202686203,
"grad_norm": 0.4367154826598129,
"learning_rate": 3.1522072625980466e-05,
"loss": 0.1231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07076150923967361,
"step": 3220,
"valid_targets_mean": 2673.8,
"valid_targets_min": 1498
},
{
"epoch": 2.624338624338624,
"grad_norm": 0.24902381526805464,
"learning_rate": 3.1488880959582905e-05,
"loss": 0.1221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03554770350456238,
"step": 3225,
"valid_targets_mean": 4407.2,
"valid_targets_min": 3285
},
{
"epoch": 2.6284086284086285,
"grad_norm": 0.2979605188474624,
"learning_rate": 3.14556419986459e-05,
"loss": 0.0961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05047299340367317,
"step": 3230,
"valid_targets_mean": 3491.2,
"valid_targets_min": 1048
},
{
"epoch": 2.6324786324786325,
"grad_norm": 0.3571486698231609,
"learning_rate": 3.142235587999924e-05,
"loss": 0.1024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05532723292708397,
"step": 3235,
"valid_targets_mean": 2983.9,
"valid_targets_min": 1290
},
{
"epoch": 2.6365486365486364,
"grad_norm": 0.4898779952522662,
"learning_rate": 3.138902274066688e-05,
"loss": 0.0993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058787234127521515,
"step": 3240,
"valid_targets_mean": 2018.6,
"valid_targets_min": 720
},
{
"epoch": 2.6406186406186407,
"grad_norm": 0.3257155158788977,
"learning_rate": 3.13556427178663e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05110851302742958,
"step": 3245,
"valid_targets_mean": 3854.4,
"valid_targets_min": 2336
},
{
"epoch": 2.6446886446886446,
"grad_norm": 0.34560277752942015,
"learning_rate": 3.1322215949008e-05,
"loss": 0.093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04530660808086395,
"step": 3250,
"valid_targets_mean": 2544.9,
"valid_targets_min": 782
},
{
"epoch": 2.6487586487586485,
"grad_norm": 0.39091465479047305,
"learning_rate": 3.1288742571694905e-05,
"loss": 0.1043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036396391689777374,
"step": 3255,
"valid_targets_mean": 3094.4,
"valid_targets_min": 1086
},
{
"epoch": 2.652828652828653,
"grad_norm": 0.34705120235384473,
"learning_rate": 3.1255222723721815e-05,
"loss": 0.0876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045067206025123596,
"step": 3260,
"valid_targets_mean": 3285.0,
"valid_targets_min": 732
},
{
"epoch": 2.656898656898657,
"grad_norm": 0.537067848663477,
"learning_rate": 3.12216565430748e-05,
"loss": 0.1162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0710548609495163,
"step": 3265,
"valid_targets_mean": 1575.8,
"valid_targets_min": 770
},
{
"epoch": 2.6609686609686607,
"grad_norm": 0.39399172193475046,
"learning_rate": 3.118804416793069e-05,
"loss": 0.1081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04866083711385727,
"step": 3270,
"valid_targets_mean": 2609.9,
"valid_targets_min": 592
},
{
"epoch": 2.665038665038665,
"grad_norm": 0.4293292007143029,
"learning_rate": 3.115438573665649e-05,
"loss": 0.12,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055250879377126694,
"step": 3275,
"valid_targets_mean": 3045.1,
"valid_targets_min": 2224
},
{
"epoch": 2.669108669108669,
"grad_norm": 0.39199172279612116,
"learning_rate": 3.112068138780876e-05,
"loss": 0.1163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041924867779016495,
"step": 3280,
"valid_targets_mean": 2729.9,
"valid_targets_min": 511
},
{
"epoch": 2.6731786731786733,
"grad_norm": 0.36149115315511404,
"learning_rate": 3.108693126013308e-05,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.056219682097435,
"step": 3285,
"valid_targets_mean": 3708.0,
"valid_targets_min": 2328
},
{
"epoch": 2.677248677248677,
"grad_norm": 0.39693264903199954,
"learning_rate": 3.105313549256352e-05,
"loss": 0.0941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0479307621717453,
"step": 3290,
"valid_targets_mean": 3069.4,
"valid_targets_min": 884
},
{
"epoch": 2.6813186813186816,
"grad_norm": 0.6370107315415748,
"learning_rate": 3.1019294224222015e-05,
"loss": 0.1239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06845805794000626,
"step": 3295,
"valid_targets_mean": 1417.6,
"valid_targets_min": 534
},
{
"epoch": 2.6853886853886855,
"grad_norm": 0.6791334033335826,
"learning_rate": 3.098540759441778e-05,
"loss": 0.1326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0740579143166542,
"step": 3300,
"valid_targets_mean": 1554.2,
"valid_targets_min": 568
},
{
"epoch": 2.6894586894586894,
"grad_norm": 0.40157879779417277,
"learning_rate": 3.0951475742646784e-05,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05114832520484924,
"step": 3305,
"valid_targets_mean": 3759.4,
"valid_targets_min": 2808
},
{
"epoch": 2.6935286935286937,
"grad_norm": 0.48697071062687214,
"learning_rate": 3.0917498808591154e-05,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15444746613502502,
"step": 3310,
"valid_targets_mean": 2962.8,
"valid_targets_min": 652
},
{
"epoch": 2.6975986975986976,
"grad_norm": 0.35131488324463145,
"learning_rate": 3.088347693211861e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05616980791091919,
"step": 3315,
"valid_targets_mean": 4014.0,
"valid_targets_min": 3573
},
{
"epoch": 2.7016687016687015,
"grad_norm": 0.9395914594142927,
"learning_rate": 3.084941025328185e-05,
"loss": 0.1178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06727755814790726,
"step": 3320,
"valid_targets_mean": 2568.0,
"valid_targets_min": 822
},
{
"epoch": 2.705738705738706,
"grad_norm": 0.6735134741940402,
"learning_rate": 3.081529891231802e-05,
"loss": 0.1426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18474054336547852,
"step": 3325,
"valid_targets_mean": 2774.0,
"valid_targets_min": 2135
},
{
"epoch": 2.70980870980871,
"grad_norm": 0.3312285374873109,
"learning_rate": 3.078114304964814e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045162081718444824,
"step": 3330,
"valid_targets_mean": 4021.2,
"valid_targets_min": 636
},
{
"epoch": 2.7138787138787137,
"grad_norm": 0.37157549346068147,
"learning_rate": 3.0746942805876474e-05,
"loss": 0.0963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07260533422231674,
"step": 3335,
"valid_targets_mean": 4983.9,
"valid_targets_min": 2733
},
{
"epoch": 2.717948717948718,
"grad_norm": 0.3681236408727857,
"learning_rate": 3.071269832178999e-05,
"loss": 0.1073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06341656297445297,
"step": 3340,
"valid_targets_mean": 4406.2,
"valid_targets_min": 2571
},
{
"epoch": 2.722018722018722,
"grad_norm": 0.30039279390137386,
"learning_rate": 3.0678409738357785e-05,
"loss": 0.1049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0368649959564209,
"step": 3345,
"valid_targets_mean": 3177.5,
"valid_targets_min": 970
},
{
"epoch": 2.726088726088726,
"grad_norm": 0.36018710976640456,
"learning_rate": 3.0644077196730494e-05,
"loss": 0.0974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035121314227581024,
"step": 3350,
"valid_targets_mean": 2699.2,
"valid_targets_min": 748
},
{
"epoch": 2.7301587301587302,
"grad_norm": 0.4353275473221667,
"learning_rate": 3.060970083823969e-05,
"loss": 0.0983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06210782751441002,
"step": 3355,
"valid_targets_mean": 3400.1,
"valid_targets_min": 719
},
{
"epoch": 2.734228734228734,
"grad_norm": 0.482149801452687,
"learning_rate": 3.057528080439734e-05,
"loss": 0.1012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05291946232318878,
"step": 3360,
"valid_targets_mean": 2561.8,
"valid_targets_min": 1820
},
{
"epoch": 2.738298738298738,
"grad_norm": 0.41734213557928257,
"learning_rate": 3.054081723689518e-05,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060540057718753815,
"step": 3365,
"valid_targets_mean": 3014.8,
"valid_targets_min": 950
},
{
"epoch": 2.7423687423687424,
"grad_norm": 0.5192547449781431,
"learning_rate": 3.050631027760418e-05,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06714431941509247,
"step": 3370,
"valid_targets_mean": 3569.5,
"valid_targets_min": 3170
},
{
"epoch": 2.7464387464387463,
"grad_norm": 0.35017994375089784,
"learning_rate": 3.0471760068573926e-05,
"loss": 0.0779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04404710233211517,
"step": 3375,
"valid_targets_mean": 3777.1,
"valid_targets_min": 3122
},
{
"epoch": 2.7505087505087507,
"grad_norm": 0.3637498254659091,
"learning_rate": 3.0437166752032027e-05,
"loss": 0.0901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05123971402645111,
"step": 3380,
"valid_targets_mean": 4054.6,
"valid_targets_min": 3511
},
{
"epoch": 2.7545787545787546,
"grad_norm": 0.3404345345130886,
"learning_rate": 3.0402530470383573e-05,
"loss": 0.087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051291994750499725,
"step": 3385,
"valid_targets_mean": 3485.4,
"valid_targets_min": 792
},
{
"epoch": 2.758648758648759,
"grad_norm": 0.46398708542556194,
"learning_rate": 3.0367851366210507e-05,
"loss": 0.1075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05058937892317772,
"step": 3390,
"valid_targets_mean": 2089.2,
"valid_targets_min": 795
},
{
"epoch": 2.762718762718763,
"grad_norm": 0.34745051162795376,
"learning_rate": 3.0333129582271043e-05,
"loss": 0.1277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04806285351514816,
"step": 3395,
"valid_targets_mean": 3405.9,
"valid_targets_min": 1196
},
{
"epoch": 2.7667887667887667,
"grad_norm": 0.4972495007269904,
"learning_rate": 3.029836526149911e-05,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058603860437870026,
"step": 3400,
"valid_targets_mean": 2210.1,
"valid_targets_min": 575
},
{
"epoch": 2.770858770858771,
"grad_norm": 0.6469804675168275,
"learning_rate": 3.0263558547003734e-05,
"loss": 0.1165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08365291357040405,
"step": 3405,
"valid_targets_mean": 1888.6,
"valid_targets_min": 609
},
{
"epoch": 2.774928774928775,
"grad_norm": 0.5555623184854452,
"learning_rate": 3.022870958206845e-05,
"loss": 0.1227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04522637277841568,
"step": 3410,
"valid_targets_mean": 1463.1,
"valid_targets_min": 542
},
{
"epoch": 2.778998778998779,
"grad_norm": 0.3659096617640059,
"learning_rate": 3.019381851015072e-05,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043918170034885406,
"step": 3415,
"valid_targets_mean": 3743.8,
"valid_targets_min": 2776
},
{
"epoch": 2.7830687830687832,
"grad_norm": 0.4195904880972671,
"learning_rate": 3.0158885474881354e-05,
"loss": 0.1064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039590660482645035,
"step": 3420,
"valid_targets_mean": 1335.4,
"valid_targets_min": 629
},
{
"epoch": 2.787138787138787,
"grad_norm": 0.5872682399941394,
"learning_rate": 3.0123910620063888e-05,
"loss": 0.1287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05974281579256058,
"step": 3425,
"valid_targets_mean": 3961.1,
"valid_targets_min": 3701
},
{
"epoch": 2.791208791208791,
"grad_norm": 0.42579563457253944,
"learning_rate": 3.008889408967403e-05,
"loss": 0.1103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05832969397306442,
"step": 3430,
"valid_targets_mean": 2015.1,
"valid_targets_min": 736
},
{
"epoch": 2.7952787952787954,
"grad_norm": 0.49595139616926265,
"learning_rate": 3.0053836027859024e-05,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08861617743968964,
"step": 3435,
"valid_targets_mean": 2458.6,
"valid_targets_min": 605
},
{
"epoch": 2.7993487993487993,
"grad_norm": 0.31433751021873957,
"learning_rate": 3.0018736578937112e-05,
"loss": 0.0902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03106316737830639,
"step": 3440,
"valid_targets_mean": 2187.8,
"valid_targets_min": 848
},
{
"epoch": 2.8034188034188032,
"grad_norm": 0.30827047949470593,
"learning_rate": 2.9983595887396864e-05,
"loss": 0.0911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04991922527551651,
"step": 3445,
"valid_targets_mean": 5241.1,
"valid_targets_min": 4456
},
{
"epoch": 2.8074888074888076,
"grad_norm": 0.37077247640612376,
"learning_rate": 2.9948414097896678e-05,
"loss": 0.0949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057815488427877426,
"step": 3450,
"valid_targets_mean": 4078.9,
"valid_targets_min": 1864
},
{
"epoch": 2.8115588115588115,
"grad_norm": 0.3475158518838076,
"learning_rate": 2.9913191355264092e-05,
"loss": 0.1095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04626894369721413,
"step": 3455,
"valid_targets_mean": 3414.1,
"valid_targets_min": 1361
},
{
"epoch": 2.8156288156288154,
"grad_norm": 0.3999990815443734,
"learning_rate": 2.9877927804495255e-05,
"loss": 0.1089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0528426468372345,
"step": 3460,
"valid_targets_mean": 3541.4,
"valid_targets_min": 1814
},
{
"epoch": 2.8196988196988197,
"grad_norm": 0.5010947429743733,
"learning_rate": 2.9842623590754294e-05,
"loss": 0.1171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04774967581033707,
"step": 3465,
"valid_targets_mean": 1152.0,
"valid_targets_min": 716
},
{
"epoch": 2.8237688237688237,
"grad_norm": 0.33526324008830605,
"learning_rate": 2.980727885937272e-05,
"loss": 0.0832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04189581423997879,
"step": 3470,
"valid_targets_mean": 3898.9,
"valid_targets_min": 2719
},
{
"epoch": 2.8278388278388276,
"grad_norm": 0.5262205319214922,
"learning_rate": 2.9771893755848857e-05,
"loss": 0.1081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039720356464385986,
"step": 3475,
"valid_targets_mean": 1102.4,
"valid_targets_min": 664
},
{
"epoch": 2.831908831908832,
"grad_norm": 0.3448120952299084,
"learning_rate": 2.97364684258472e-05,
"loss": 0.1029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03923565521836281,
"step": 3480,
"valid_targets_mean": 2702.8,
"valid_targets_min": 1584
},
{
"epoch": 2.835978835978836,
"grad_norm": 0.3424380111555321,
"learning_rate": 2.9701003015197862e-05,
"loss": 0.0824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037075385451316833,
"step": 3485,
"valid_targets_mean": 2633.6,
"valid_targets_min": 1003
},
{
"epoch": 2.84004884004884,
"grad_norm": 0.37114327921089785,
"learning_rate": 2.9665497669895926e-05,
"loss": 0.1087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04176440089941025,
"step": 3490,
"valid_targets_mean": 2853.4,
"valid_targets_min": 560
},
{
"epoch": 2.844118844118844,
"grad_norm": 0.35943776778483205,
"learning_rate": 2.962995253610089e-05,
"loss": 0.1022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05177730694413185,
"step": 3495,
"valid_targets_mean": 3300.2,
"valid_targets_min": 1049
},
{
"epoch": 2.8481888481888484,
"grad_norm": 0.46323078254655087,
"learning_rate": 2.9594367760136026e-05,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07231918722391129,
"step": 3500,
"valid_targets_mean": 2829.9,
"valid_targets_min": 1497
},
{
"epoch": 2.8522588522588523,
"grad_norm": 0.4260912091223462,
"learning_rate": 2.955874348848781e-05,
"loss": 0.1006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05701189488172531,
"step": 3505,
"valid_targets_mean": 3187.1,
"valid_targets_min": 825
},
{
"epoch": 2.8563288563288562,
"grad_norm": 0.49909290086865893,
"learning_rate": 2.952307986780528e-05,
"loss": 0.117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06764853000640869,
"step": 3510,
"valid_targets_mean": 2835.8,
"valid_targets_min": 829
},
{
"epoch": 2.8603988603988606,
"grad_norm": 0.45907551992299245,
"learning_rate": 2.9487377044899487e-05,
"loss": 0.1089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050722379237413406,
"step": 3515,
"valid_targets_mean": 2051.9,
"valid_targets_min": 650
},
{
"epoch": 2.8644688644688645,
"grad_norm": 0.4353504024468164,
"learning_rate": 2.945163516674284e-05,
"loss": 0.1086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05996803194284439,
"step": 3520,
"valid_targets_mean": 2904.0,
"valid_targets_min": 729
},
{
"epoch": 2.8685388685388684,
"grad_norm": 0.30376720990195905,
"learning_rate": 2.9415854380468523e-05,
"loss": 0.0927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03928172215819359,
"step": 3525,
"valid_targets_mean": 3957.1,
"valid_targets_min": 3408
},
{
"epoch": 2.8726088726088728,
"grad_norm": 0.3136319878421944,
"learning_rate": 2.9380034833369892e-05,
"loss": 0.0944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03363402932882309,
"step": 3530,
"valid_targets_mean": 3422.8,
"valid_targets_min": 2543
},
{
"epoch": 2.8766788766788767,
"grad_norm": 0.43540877616440243,
"learning_rate": 2.934417667289986e-05,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061333850026130676,
"step": 3535,
"valid_targets_mean": 2753.1,
"valid_targets_min": 1072
},
{
"epoch": 2.8807488807488806,
"grad_norm": 0.3782032866681542,
"learning_rate": 2.9308280046670306e-05,
"loss": 0.0878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046056248247623444,
"step": 3540,
"valid_targets_mean": 2810.2,
"valid_targets_min": 702
},
{
"epoch": 2.884818884818885,
"grad_norm": 0.38282746322202976,
"learning_rate": 2.9272345102451424e-05,
"loss": 0.0974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06318642199039459,
"step": 3545,
"valid_targets_mean": 5088.1,
"valid_targets_min": 976
},
{
"epoch": 2.888888888888889,
"grad_norm": 0.34609048416468996,
"learning_rate": 2.923637198817118e-05,
"loss": 0.096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043254029005765915,
"step": 3550,
"valid_targets_mean": 4085.0,
"valid_targets_min": 484
},
{
"epoch": 2.8929588929588927,
"grad_norm": 0.2674998878729295,
"learning_rate": 2.920036085191466e-05,
"loss": 0.0825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03606154024600983,
"step": 3555,
"valid_targets_mean": 4375.1,
"valid_targets_min": 1148
},
{
"epoch": 2.897028897028897,
"grad_norm": 0.4242295936507459,
"learning_rate": 2.9164311841923453e-05,
"loss": 0.0987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07503281533718109,
"step": 3560,
"valid_targets_mean": 4233.1,
"valid_targets_min": 3268
},
{
"epoch": 2.901098901098901,
"grad_norm": 0.3646136002979487,
"learning_rate": 2.9128225106595073e-05,
"loss": 0.0969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050537366420030594,
"step": 3565,
"valid_targets_mean": 3133.2,
"valid_targets_min": 559
},
{
"epoch": 2.905168905168905,
"grad_norm": 0.3850447940122486,
"learning_rate": 2.909210079448233e-05,
"loss": 0.1205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04207482933998108,
"step": 3570,
"valid_targets_mean": 2683.9,
"valid_targets_min": 689
},
{
"epoch": 2.9092389092389093,
"grad_norm": 0.4532382464548252,
"learning_rate": 2.905593905429272e-05,
"loss": 0.1218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06049978733062744,
"step": 3575,
"valid_targets_mean": 1883.4,
"valid_targets_min": 616
},
{
"epoch": 2.913308913308913,
"grad_norm": 0.4613149439936778,
"learning_rate": 2.9019740034887812e-05,
"loss": 0.078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053340524435043335,
"step": 3580,
"valid_targets_mean": 2458.2,
"valid_targets_min": 602
},
{
"epoch": 2.9173789173789175,
"grad_norm": 0.3550345526134136,
"learning_rate": 2.898350388528263e-05,
"loss": 0.1219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05539257824420929,
"step": 3585,
"valid_targets_mean": 3971.8,
"valid_targets_min": 3551
},
{
"epoch": 2.9214489214489214,
"grad_norm": 0.4104168375230188,
"learning_rate": 2.8947230754645056e-05,
"loss": 0.0957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03185092657804489,
"step": 3590,
"valid_targets_mean": 1747.2,
"valid_targets_min": 596
},
{
"epoch": 2.925518925518926,
"grad_norm": 0.335588797815782,
"learning_rate": 2.891092079229521e-05,
"loss": 0.1003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04076407849788666,
"step": 3595,
"valid_targets_mean": 3301.9,
"valid_targets_min": 799
},
{
"epoch": 2.9295889295889297,
"grad_norm": 0.43098042545889287,
"learning_rate": 2.887457414770482e-05,
"loss": 0.1138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058630071580410004,
"step": 3600,
"valid_targets_mean": 3122.6,
"valid_targets_min": 706
},
{
"epoch": 2.9336589336589336,
"grad_norm": 0.44968298408503327,
"learning_rate": 2.883819097049662e-05,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05955217033624649,
"step": 3605,
"valid_targets_mean": 1916.1,
"valid_targets_min": 710
},
{
"epoch": 2.937728937728938,
"grad_norm": 0.3761169572763773,
"learning_rate": 2.880177141044374e-05,
"loss": 0.106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042976461350917816,
"step": 3610,
"valid_targets_mean": 3087.8,
"valid_targets_min": 647
},
{
"epoch": 2.941798941798942,
"grad_norm": 0.49089665811727856,
"learning_rate": 2.8765315617469083e-05,
"loss": 0.1023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04839683324098587,
"step": 3615,
"valid_targets_mean": 1806.6,
"valid_targets_min": 716
},
{
"epoch": 2.9458689458689458,
"grad_norm": 0.3819345463527236,
"learning_rate": 2.8728823741644693e-05,
"loss": 0.096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055881187319755554,
"step": 3620,
"valid_targets_mean": 3530.9,
"valid_targets_min": 2920
},
{
"epoch": 2.94993894993895,
"grad_norm": 0.4248398215986827,
"learning_rate": 2.869229593319115e-05,
"loss": 0.0982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05369921028614044,
"step": 3625,
"valid_targets_mean": 2021.4,
"valid_targets_min": 832
},
{
"epoch": 2.954008954008954,
"grad_norm": 0.5366502780379148,
"learning_rate": 2.8655732342476974e-05,
"loss": 0.0871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04955916851758957,
"step": 3630,
"valid_targets_mean": 1252.5,
"valid_targets_min": 759
},
{
"epoch": 2.958078958078958,
"grad_norm": 0.3725411467334531,
"learning_rate": 2.8619133120017977e-05,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04662502557039261,
"step": 3635,
"valid_targets_mean": 3125.5,
"valid_targets_min": 756
},
{
"epoch": 2.9621489621489623,
"grad_norm": 0.4735438299144219,
"learning_rate": 2.858249841647663e-05,
"loss": 0.0898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06342704594135284,
"step": 3640,
"valid_targets_mean": 2589.4,
"valid_targets_min": 744
},
{
"epoch": 2.966218966218966,
"grad_norm": 0.3229059404155852,
"learning_rate": 2.8545828382661483e-05,
"loss": 0.0944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03534681349992752,
"step": 3645,
"valid_targets_mean": 2489.9,
"valid_targets_min": 529
},
{
"epoch": 2.97028897028897,
"grad_norm": 0.4160099670775479,
"learning_rate": 2.850912316952653e-05,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06118070334196091,
"step": 3650,
"valid_targets_mean": 3904.1,
"valid_targets_min": 2017
},
{
"epoch": 2.9743589743589745,
"grad_norm": 0.27448891928689173,
"learning_rate": 2.847238292817057e-05,
"loss": 0.0903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03835466504096985,
"step": 3655,
"valid_targets_mean": 4848.6,
"valid_targets_min": 516
},
{
"epoch": 2.9784289784289784,
"grad_norm": 0.3412081869287908,
"learning_rate": 2.8435607809836585e-05,
"loss": 0.0875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03919822350144386,
"step": 3660,
"valid_targets_mean": 2295.4,
"valid_targets_min": 772
},
{
"epoch": 2.9824989824989823,
"grad_norm": 0.369354587305238,
"learning_rate": 2.8398797965911164e-05,
"loss": 0.0966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05215475335717201,
"step": 3665,
"valid_targets_mean": 4149.0,
"valid_targets_min": 2807
},
{
"epoch": 2.9865689865689866,
"grad_norm": 0.4781896046920586,
"learning_rate": 2.836195354792382e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11530614644289017,
"step": 3670,
"valid_targets_mean": 3047.1,
"valid_targets_min": 2759
},
{
"epoch": 2.9906389906389905,
"grad_norm": 0.32100235515429487,
"learning_rate": 2.8325074707546397e-05,
"loss": 0.102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03835485503077507,
"step": 3675,
"valid_targets_mean": 3380.2,
"valid_targets_min": 941
},
{
"epoch": 2.9947089947089944,
"grad_norm": 0.3685878918749171,
"learning_rate": 2.8288161596592445e-05,
"loss": 0.1049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029963500797748566,
"step": 3680,
"valid_targets_mean": 2062.9,
"valid_targets_min": 759
},
{
"epoch": 2.998778998778999,
"grad_norm": 0.5570354007672066,
"learning_rate": 2.8251214367016584e-05,
"loss": 0.1036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11446891725063324,
"step": 3685,
"valid_targets_mean": 2155.2,
"valid_targets_min": 927
},
{
"epoch": 3.0024420024420024,
"grad_norm": 0.5300936680238741,
"learning_rate": 2.8214233170913897e-05,
"loss": 0.1816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10420374572277069,
"step": 3690,
"valid_targets_mean": 5435.1,
"valid_targets_min": 3516
},
{
"epoch": 3.0065120065120063,
"grad_norm": 0.38181099491046794,
"learning_rate": 2.8177218160519274e-05,
"loss": 0.2127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10185196250677109,
"step": 3695,
"valid_targets_mean": 7654.2,
"valid_targets_min": 6354
},
{
"epoch": 3.0105820105820107,
"grad_norm": 0.3636523334412447,
"learning_rate": 2.8140169488206813e-05,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11651530861854553,
"step": 3700,
"valid_targets_mean": 7341.6,
"valid_targets_min": 5754
},
{
"epoch": 3.0146520146520146,
"grad_norm": 0.35386050254952656,
"learning_rate": 2.810308730648919e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0877489298582077,
"step": 3705,
"valid_targets_mean": 7666.2,
"valid_targets_min": 5666
},
{
"epoch": 3.0187220187220185,
"grad_norm": 0.39000718209727786,
"learning_rate": 2.8065971768017014e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1017606109380722,
"step": 3710,
"valid_targets_mean": 7469.0,
"valid_targets_min": 5646
},
{
"epoch": 3.022792022792023,
"grad_norm": 0.3982430381116518,
"learning_rate": 2.802882302557821e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11622816324234009,
"step": 3715,
"valid_targets_mean": 7046.9,
"valid_targets_min": 5571
},
{
"epoch": 3.0268620268620268,
"grad_norm": 0.3840578048570892,
"learning_rate": 2.7991641232097385e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11238230019807816,
"step": 3720,
"valid_targets_mean": 7827.6,
"valid_targets_min": 5405
},
{
"epoch": 3.030932030932031,
"grad_norm": 0.37593713287199076,
"learning_rate": 2.7954426540635213e-05,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10586348176002502,
"step": 3725,
"valid_targets_mean": 7023.5,
"valid_targets_min": 5664
},
{
"epoch": 3.035002035002035,
"grad_norm": 0.3617967688248237,
"learning_rate": 2.7917179104387792e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09483138471841812,
"step": 3730,
"valid_targets_mean": 7069.8,
"valid_targets_min": 5103
},
{
"epoch": 3.039072039072039,
"grad_norm": 0.37727049937650137,
"learning_rate": 2.787989907668601e-05,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09244755655527115,
"step": 3735,
"valid_targets_mean": 6712.4,
"valid_targets_min": 5469
},
{
"epoch": 3.0431420431420433,
"grad_norm": 0.3766512807014509,
"learning_rate": 2.7842586610994913e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09342852234840393,
"step": 3740,
"valid_targets_mean": 7289.2,
"valid_targets_min": 5513
},
{
"epoch": 3.047212047212047,
"grad_norm": 0.3695612492414105,
"learning_rate": 2.7805241860913095e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09307433664798737,
"step": 3745,
"valid_targets_mean": 7022.1,
"valid_targets_min": 5691
},
{
"epoch": 3.051282051282051,
"grad_norm": 0.39612551211364405,
"learning_rate": 2.7767864980172046e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10077991336584091,
"step": 3750,
"valid_targets_mean": 6736.0,
"valid_targets_min": 5550
},
{
"epoch": 3.0553520553520555,
"grad_norm": 0.4921659164636033,
"learning_rate": 2.773045612263552e-05,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09157957881689072,
"step": 3755,
"valid_targets_mean": 6346.9,
"valid_targets_min": 5067
},
{
"epoch": 3.0594220594220594,
"grad_norm": 0.4073510419270923,
"learning_rate": 2.7693015442298896e-05,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.095358707010746,
"step": 3760,
"valid_targets_mean": 6784.0,
"valid_targets_min": 5618
},
{
"epoch": 3.0634920634920633,
"grad_norm": 0.4015377800668027,
"learning_rate": 2.7655543093288567e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10923737287521362,
"step": 3765,
"valid_targets_mean": 7568.4,
"valid_targets_min": 5856
},
{
"epoch": 3.0675620675620676,
"grad_norm": 0.4034210421570319,
"learning_rate": 2.7618039229861298e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09021735936403275,
"step": 3770,
"valid_targets_mean": 7198.5,
"valid_targets_min": 4793
},
{
"epoch": 3.0716320716320715,
"grad_norm": 0.3908082661531363,
"learning_rate": 2.7580504006403565e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09716609120368958,
"step": 3775,
"valid_targets_mean": 6680.5,
"valid_targets_min": 5350
},
{
"epoch": 3.075702075702076,
"grad_norm": 0.38406455833735326,
"learning_rate": 2.7542937577430947e-05,
"loss": 0.2048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1004624292254448,
"step": 3780,
"valid_targets_mean": 6770.6,
"valid_targets_min": 5753
},
{
"epoch": 3.07977207977208,
"grad_norm": 0.7240136077873857,
"learning_rate": 2.7505340097587488e-05,
"loss": 0.2012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07324851304292679,
"step": 3785,
"valid_targets_mean": 1419.8,
"valid_targets_min": 289
},
{
"epoch": 3.0838420838420837,
"grad_norm": 0.4204933410198007,
"learning_rate": 2.7467711721645045e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09934137761592865,
"step": 3790,
"valid_targets_mean": 6784.2,
"valid_targets_min": 5042
},
{
"epoch": 3.087912087912088,
"grad_norm": 0.3742729131572597,
"learning_rate": 2.7430052604502663e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09341548383235931,
"step": 3795,
"valid_targets_mean": 6774.9,
"valid_targets_min": 3875
},
{
"epoch": 3.091982091982092,
"grad_norm": 0.41169203877187577,
"learning_rate": 2.7392362901185944e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09741862118244171,
"step": 3800,
"valid_targets_mean": 7047.6,
"valid_targets_min": 6134
},
{
"epoch": 3.096052096052096,
"grad_norm": 0.3908141039193812,
"learning_rate": 2.7354642766846383e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10031354427337646,
"step": 3805,
"valid_targets_mean": 6886.6,
"valid_targets_min": 5869
},
{
"epoch": 3.1001221001221,
"grad_norm": 0.3737173994845085,
"learning_rate": 2.7316892356760768e-05,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0877181887626648,
"step": 3810,
"valid_targets_mean": 7559.8,
"valid_targets_min": 6145
},
{
"epoch": 3.104192104192104,
"grad_norm": 0.345233755743295,
"learning_rate": 2.727911182633049e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08521901816129684,
"step": 3815,
"valid_targets_mean": 8920.5,
"valid_targets_min": 4780
},
{
"epoch": 3.1082621082621085,
"grad_norm": 0.3279700741389342,
"learning_rate": 2.724130133108096e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07514619082212448,
"step": 3820,
"valid_targets_mean": 7393.4,
"valid_targets_min": 5116
},
{
"epoch": 3.1123321123321124,
"grad_norm": 0.31728564944220194,
"learning_rate": 2.720346102666092e-05,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08252862095832825,
"step": 3825,
"valid_targets_mean": 8477.5,
"valid_targets_min": 4033
},
{
"epoch": 3.1164021164021163,
"grad_norm": 0.3897732561895216,
"learning_rate": 2.7165591068841835e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09388996660709381,
"step": 3830,
"valid_targets_mean": 6736.6,
"valid_targets_min": 4646
},
{
"epoch": 3.1204721204721206,
"grad_norm": 0.4003693550688361,
"learning_rate": 2.7127691613517236e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09637527167797089,
"step": 3835,
"valid_targets_mean": 7551.5,
"valid_targets_min": 5461
},
{
"epoch": 3.1245421245421245,
"grad_norm": 0.42189953518448664,
"learning_rate": 2.7089762816702072e-05,
"loss": 0.198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11182335764169693,
"step": 3840,
"valid_targets_mean": 7091.0,
"valid_targets_min": 4879
},
{
"epoch": 3.1286121286121285,
"grad_norm": 0.3964626223828562,
"learning_rate": 2.70518048345321e-05,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08981172740459442,
"step": 3845,
"valid_targets_mean": 6269.8,
"valid_targets_min": 4606
},
{
"epoch": 3.132682132682133,
"grad_norm": 0.4236778964061071,
"learning_rate": 2.7013817823263206e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08929223567247391,
"step": 3850,
"valid_targets_mean": 6818.4,
"valid_targets_min": 5525
},
{
"epoch": 3.1367521367521367,
"grad_norm": 0.4184282493040094,
"learning_rate": 2.6975801939270762e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09297116100788116,
"step": 3855,
"valid_targets_mean": 7365.4,
"valid_targets_min": 5000
},
{
"epoch": 3.1408221408221406,
"grad_norm": 0.3991658399742734,
"learning_rate": 2.6937757339049027e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08477732539176941,
"step": 3860,
"valid_targets_mean": 6212.1,
"valid_targets_min": 3988
},
{
"epoch": 3.144892144892145,
"grad_norm": 0.3522450277037621,
"learning_rate": 2.6899684179210446e-05,
"loss": 0.1925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09426316618919373,
"step": 3865,
"valid_targets_mean": 8396.9,
"valid_targets_min": 6131
},
{
"epoch": 3.148962148962149,
"grad_norm": 0.40217083920878643,
"learning_rate": 2.6861582616485048e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09596344083547592,
"step": 3870,
"valid_targets_mean": 7651.0,
"valid_targets_min": 4061
},
{
"epoch": 3.1530321530321532,
"grad_norm": 0.38649324870646884,
"learning_rate": 2.6823452807719763e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09395226836204529,
"step": 3875,
"valid_targets_mean": 7090.1,
"valid_targets_min": 5203
},
{
"epoch": 3.157102157102157,
"grad_norm": 0.37118239164661415,
"learning_rate": 2.678529490987783e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09067308902740479,
"step": 3880,
"valid_targets_mean": 7001.0,
"valid_targets_min": 5362
},
{
"epoch": 3.161172161172161,
"grad_norm": 0.3848861837027517,
"learning_rate": 2.674710908003808e-05,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09417563676834106,
"step": 3885,
"valid_targets_mean": 6359.2,
"valid_targets_min": 5236
},
{
"epoch": 3.1652421652421654,
"grad_norm": 0.407400812686477,
"learning_rate": 2.6708895475394362e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10153548419475555,
"step": 3890,
"valid_targets_mean": 5939.8,
"valid_targets_min": 4693
},
{
"epoch": 3.1693121693121693,
"grad_norm": 1.1139169285060038,
"learning_rate": 2.6670654253254834e-05,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03590000420808792,
"step": 3895,
"valid_targets_mean": 208.6,
"valid_targets_min": 134
},
{
"epoch": 3.173382173382173,
"grad_norm": 0.4169772802304493,
"learning_rate": 2.663238557104136e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09831123054027557,
"step": 3900,
"valid_targets_mean": 6008.5,
"valid_targets_min": 4956
},
{
"epoch": 3.1774521774521776,
"grad_norm": 0.37807853509176925,
"learning_rate": 2.659408958628883e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08299198746681213,
"step": 3905,
"valid_targets_mean": 6042.0,
"valid_targets_min": 4817
},
{
"epoch": 3.1815221815221815,
"grad_norm": 0.3981260221085175,
"learning_rate": 2.6555766456644553e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09234784543514252,
"step": 3910,
"valid_targets_mean": 6608.6,
"valid_targets_min": 5102
},
{
"epoch": 3.185592185592186,
"grad_norm": 0.3880642673862131,
"learning_rate": 2.6517416339867544e-05,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09438446909189224,
"step": 3915,
"valid_targets_mean": 6670.1,
"valid_targets_min": 4869
},
{
"epoch": 3.1896621896621897,
"grad_norm": 0.38644112067025166,
"learning_rate": 2.6479039393827944e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08336789160966873,
"step": 3920,
"valid_targets_mean": 6088.4,
"valid_targets_min": 4946
},
{
"epoch": 3.1937321937321936,
"grad_norm": 0.4014072145721109,
"learning_rate": 2.6440635776506316e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08969050645828247,
"step": 3925,
"valid_targets_mean": 6228.4,
"valid_targets_min": 4856
},
{
"epoch": 3.197802197802198,
"grad_norm": 0.4562972639302328,
"learning_rate": 2.6402205645993038e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09550561010837555,
"step": 3930,
"valid_targets_mean": 5376.6,
"valid_targets_min": 4145
},
{
"epoch": 3.201872201872202,
"grad_norm": 0.48273208307655285,
"learning_rate": 2.636374916048761e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09403058886528015,
"step": 3935,
"valid_targets_mean": 6309.2,
"valid_targets_min": 5305
},
{
"epoch": 3.205942205942206,
"grad_norm": 0.40883426520856037,
"learning_rate": 2.6325266478298032e-05,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08947273343801498,
"step": 3940,
"valid_targets_mean": 6221.5,
"valid_targets_min": 4636
},
{
"epoch": 3.21001221001221,
"grad_norm": 0.39532763897190637,
"learning_rate": 2.6286757757840144e-05,
"loss": 0.1858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09781331568956375,
"step": 3945,
"valid_targets_mean": 6831.5,
"valid_targets_min": 5668
},
{
"epoch": 3.214082214082214,
"grad_norm": 0.4023824820856924,
"learning_rate": 2.6248223157636982e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09898592531681061,
"step": 3950,
"valid_targets_mean": 6437.1,
"valid_targets_min": 5004
},
{
"epoch": 3.218152218152218,
"grad_norm": 0.4037103091391165,
"learning_rate": 2.62096628363181e-05,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0871603712439537,
"step": 3955,
"valid_targets_mean": 6205.8,
"valid_targets_min": 5341
},
{
"epoch": 3.2222222222222223,
"grad_norm": 0.4037836380504369,
"learning_rate": 2.6171076952618943e-05,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09813414514064789,
"step": 3960,
"valid_targets_mean": 6748.0,
"valid_targets_min": 5363
},
{
"epoch": 3.2262922262922262,
"grad_norm": 0.407885387401038,
"learning_rate": 2.61324656653802e-05,
"loss": 0.184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0859188586473465,
"step": 3965,
"valid_targets_mean": 5210.5,
"valid_targets_min": 791
},
{
"epoch": 3.23036223036223,
"grad_norm": 0.6923397809278381,
"learning_rate": 2.60938291335471e-05,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07540939748287201,
"step": 3970,
"valid_targets_mean": 1279.5,
"valid_targets_min": 746
},
{
"epoch": 3.2344322344322345,
"grad_norm": 0.7921805175588379,
"learning_rate": 2.6055167516168828e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09494996815919876,
"step": 3975,
"valid_targets_mean": 1635.8,
"valid_targets_min": 661
},
{
"epoch": 3.2385022385022384,
"grad_norm": 0.7552177145973241,
"learning_rate": 2.6016480972397807e-05,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08284762501716614,
"step": 3980,
"valid_targets_mean": 1420.2,
"valid_targets_min": 826
},
{
"epoch": 3.2425722425722427,
"grad_norm": 0.768222331032816,
"learning_rate": 2.5977769661489102e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07532330602407455,
"step": 3985,
"valid_targets_mean": 1399.9,
"valid_targets_min": 742
},
{
"epoch": 3.2466422466422467,
"grad_norm": 0.7896098768251143,
"learning_rate": 2.5939033742799692e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06821978092193604,
"step": 3990,
"valid_targets_mean": 1309.9,
"valid_targets_min": 718
},
{
"epoch": 3.2507122507122506,
"grad_norm": 0.7418241829283232,
"learning_rate": 2.5900273375787898e-05,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0990295559167862,
"step": 3995,
"valid_targets_mean": 1729.4,
"valid_targets_min": 764
},
{
"epoch": 3.254782254782255,
"grad_norm": 0.6949460534292148,
"learning_rate": 2.586148872001265e-05,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08115358650684357,
"step": 4000,
"valid_targets_mean": 1651.4,
"valid_targets_min": 814
},
{
"epoch": 3.258852258852259,
"grad_norm": 0.8287359657436814,
"learning_rate": 2.5822679935132876e-05,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06513510644435883,
"step": 4005,
"valid_targets_mean": 1192.0,
"valid_targets_min": 610
},
{
"epoch": 3.2629222629222627,
"grad_norm": 0.7416322068860572,
"learning_rate": 2.578384718090685e-05,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09329591691493988,
"step": 4010,
"valid_targets_mean": 1879.0,
"valid_targets_min": 817
},
{
"epoch": 3.266992266992267,
"grad_norm": 0.6590970920655556,
"learning_rate": 2.5744990617191486e-05,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.075216144323349,
"step": 4015,
"valid_targets_mean": 1500.4,
"valid_targets_min": 837
},
{
"epoch": 3.271062271062271,
"grad_norm": 0.7902390874577276,
"learning_rate": 2.5706110403941724e-05,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11390472203493118,
"step": 4020,
"valid_targets_mean": 1661.8,
"valid_targets_min": 593
},
{
"epoch": 3.2751322751322753,
"grad_norm": 0.6950850372161688,
"learning_rate": 2.5667206701209876e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08275754749774933,
"step": 4025,
"valid_targets_mean": 1537.8,
"valid_targets_min": 704
},
{
"epoch": 3.2792022792022792,
"grad_norm": 0.7394050894613096,
"learning_rate": 2.562827966914492e-05,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06054488569498062,
"step": 4030,
"valid_targets_mean": 1227.0,
"valid_targets_min": 722
},
{
"epoch": 3.283272283272283,
"grad_norm": 0.6772775941130794,
"learning_rate": 2.5589329467991885e-05,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07103030383586884,
"step": 4035,
"valid_targets_mean": 1364.5,
"valid_targets_min": 642
},
{
"epoch": 3.2873422873422875,
"grad_norm": 0.7940146053459805,
"learning_rate": 2.555035625809118e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07808074355125427,
"step": 4040,
"valid_targets_mean": 1358.5,
"valid_targets_min": 518
},
{
"epoch": 3.2914122914122914,
"grad_norm": 0.7802294896653876,
"learning_rate": 2.5511360199877934e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10007496178150177,
"step": 4045,
"valid_targets_mean": 1590.6,
"valid_targets_min": 728
},
{
"epoch": 3.2954822954822953,
"grad_norm": 0.7087462700416979,
"learning_rate": 2.5472341453881316e-05,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1003953143954277,
"step": 4050,
"valid_targets_mean": 1791.4,
"valid_targets_min": 820
},
{
"epoch": 3.2995522995522997,
"grad_norm": 0.7315742027165163,
"learning_rate": 2.543330018072389e-05,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09038805961608887,
"step": 4055,
"valid_targets_mean": 1470.8,
"valid_targets_min": 818
},
{
"epoch": 3.3036223036223036,
"grad_norm": 0.7849182759993877,
"learning_rate": 2.5394236541120978e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06879038363695145,
"step": 4060,
"valid_targets_mean": 1278.6,
"valid_targets_min": 625
},
{
"epoch": 3.3076923076923075,
"grad_norm": 0.6965689168981399,
"learning_rate": 2.5355150695879952e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1073441207408905,
"step": 4065,
"valid_targets_mean": 2313.5,
"valid_targets_min": 790
},
{
"epoch": 3.311762311762312,
"grad_norm": 0.7410314939380847,
"learning_rate": 2.5316042805899616e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11727465689182281,
"step": 4070,
"valid_targets_mean": 2231.9,
"valid_targets_min": 1335
},
{
"epoch": 3.3158323158323157,
"grad_norm": 0.6764884077292488,
"learning_rate": 2.5276913032169485e-05,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09181191027164459,
"step": 4075,
"valid_targets_mean": 1729.5,
"valid_targets_min": 719
},
{
"epoch": 3.3199023199023197,
"grad_norm": 0.7670282548657762,
"learning_rate": 2.52377615357692e-05,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06349903345108032,
"step": 4080,
"valid_targets_mean": 1222.9,
"valid_targets_min": 697
},
{
"epoch": 3.323972323972324,
"grad_norm": 0.7717936984864601,
"learning_rate": 2.5198588477867806e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09327976405620575,
"step": 4085,
"valid_targets_mean": 1521.1,
"valid_targets_min": 998
},
{
"epoch": 3.328042328042328,
"grad_norm": 0.7083051922595436,
"learning_rate": 2.515939401972311e-05,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08291327953338623,
"step": 4090,
"valid_targets_mean": 1693.9,
"valid_targets_min": 629
},
{
"epoch": 3.3321123321123323,
"grad_norm": 0.7259684658670004,
"learning_rate": 2.5120178322681003e-05,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0862584039568901,
"step": 4095,
"valid_targets_mean": 1630.2,
"valid_targets_min": 1078
},
{
"epoch": 3.336182336182336,
"grad_norm": 0.6785358648236004,
"learning_rate": 2.5080941548174825e-05,
"loss": 0.1595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07994429767131805,
"step": 4100,
"valid_targets_mean": 1843.0,
"valid_targets_min": 1075
},
{
"epoch": 3.34025234025234,
"grad_norm": 0.7835115275000952,
"learning_rate": 2.5041683857724676e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09122762084007263,
"step": 4105,
"valid_targets_mean": 1848.2,
"valid_targets_min": 1317
},
{
"epoch": 3.3443223443223444,
"grad_norm": 0.7678656781444083,
"learning_rate": 2.5002405412936748e-05,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09253916144371033,
"step": 4110,
"valid_targets_mean": 1727.4,
"valid_targets_min": 957
},
{
"epoch": 3.3483923483923483,
"grad_norm": 0.7652220167507279,
"learning_rate": 2.4963106375502673e-05,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0644087865948677,
"step": 4115,
"valid_targets_mean": 1115.4,
"valid_targets_min": 643
},
{
"epoch": 3.3524623524623527,
"grad_norm": 0.749831847944443,
"learning_rate": 2.492378690719887e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08243843168020248,
"step": 4120,
"valid_targets_mean": 1547.2,
"valid_targets_min": 1111
},
{
"epoch": 3.3565323565323566,
"grad_norm": 0.7150068797955984,
"learning_rate": 2.4884447169885855e-05,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07063218951225281,
"step": 4125,
"valid_targets_mean": 1450.0,
"valid_targets_min": 705
},
{
"epoch": 3.3606023606023605,
"grad_norm": 0.8508456830574319,
"learning_rate": 2.4845087325507557e-05,
"loss": 0.1572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08344951272010803,
"step": 4130,
"valid_targets_mean": 1539.0,
"valid_targets_min": 1288
},
{
"epoch": 3.364672364672365,
"grad_norm": 0.75421710601425,
"learning_rate": 2.4805707536090708e-05,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0741521492600441,
"step": 4135,
"valid_targets_mean": 1321.2,
"valid_targets_min": 753
},
{
"epoch": 3.3687423687423688,
"grad_norm": 0.737658592772203,
"learning_rate": 2.476630796374413e-05,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07522574812173843,
"step": 4140,
"valid_targets_mean": 1480.0,
"valid_targets_min": 817
},
{
"epoch": 3.3728123728123727,
"grad_norm": 0.7186314188969304,
"learning_rate": 2.4726888770658103e-05,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06374834477901459,
"step": 4145,
"valid_targets_mean": 1293.9,
"valid_targets_min": 974
},
{
"epoch": 3.376882376882377,
"grad_norm": 0.7633726706709022,
"learning_rate": 2.4687450119103637e-05,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08639413118362427,
"step": 4150,
"valid_targets_mean": 1529.2,
"valid_targets_min": 657
},
{
"epoch": 3.380952380952381,
"grad_norm": 1.1964337610025615,
"learning_rate": 2.464799217143188e-05,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0945994108915329,
"step": 4155,
"valid_targets_mean": 1678.0,
"valid_targets_min": 880
},
{
"epoch": 3.385022385022385,
"grad_norm": 0.7985356155534645,
"learning_rate": 2.46085150900734e-05,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09271052479743958,
"step": 4160,
"valid_targets_mean": 1609.4,
"valid_targets_min": 1050
},
{
"epoch": 3.389092389092389,
"grad_norm": 1.0437056142019698,
"learning_rate": 2.4569019037537525e-05,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07413659244775772,
"step": 4165,
"valid_targets_mean": 1449.0,
"valid_targets_min": 682
},
{
"epoch": 3.393162393162393,
"grad_norm": 0.7535290857067112,
"learning_rate": 2.4529504176411685e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07152436673641205,
"step": 4170,
"valid_targets_mean": 1344.0,
"valid_targets_min": 703
},
{
"epoch": 3.397232397232397,
"grad_norm": 0.805609957537731,
"learning_rate": 2.448997066936073e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07804272323846817,
"step": 4175,
"valid_targets_mean": 1469.4,
"valid_targets_min": 934
},
{
"epoch": 3.4013024013024014,
"grad_norm": 0.9417672703147607,
"learning_rate": 2.445041867912629e-05,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11873181909322739,
"step": 4180,
"valid_targets_mean": 1829.1,
"valid_targets_min": 734
},
{
"epoch": 3.4053724053724053,
"grad_norm": 1.044289943148221,
"learning_rate": 2.4410848368526053e-05,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10154280066490173,
"step": 4185,
"valid_targets_mean": 2010.8,
"valid_targets_min": 1437
},
{
"epoch": 3.4094424094424096,
"grad_norm": 0.7104274369527875,
"learning_rate": 2.4371259900453126e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060282643884420395,
"step": 4190,
"valid_targets_mean": 1405.2,
"valid_targets_min": 551
},
{
"epoch": 3.4135124135124135,
"grad_norm": 0.8437670408273207,
"learning_rate": 2.433165343787538e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10241234302520752,
"step": 4195,
"valid_targets_mean": 1817.6,
"valid_targets_min": 931
},
{
"epoch": 3.4175824175824174,
"grad_norm": 0.726473705947651,
"learning_rate": 2.4292029143834756e-05,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07595465332269669,
"step": 4200,
"valid_targets_mean": 1599.1,
"valid_targets_min": 904
},
{
"epoch": 3.421652421652422,
"grad_norm": 0.7469567163494483,
"learning_rate": 2.425238718144659e-05,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08603636920452118,
"step": 4205,
"valid_targets_mean": 1774.8,
"valid_targets_min": 1158
},
{
"epoch": 3.4257224257224257,
"grad_norm": 0.8033287596020903,
"learning_rate": 2.4212727713898948e-05,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07098281383514404,
"step": 4210,
"valid_targets_mean": 1229.2,
"valid_targets_min": 756
},
{
"epoch": 3.42979242979243,
"grad_norm": 0.8172817454896187,
"learning_rate": 2.417305090445198e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08913031220436096,
"step": 4215,
"valid_targets_mean": 1536.9,
"valid_targets_min": 854
},
{
"epoch": 3.433862433862434,
"grad_norm": 0.7239421409227166,
"learning_rate": 2.4133356916437202e-05,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0854625403881073,
"step": 4220,
"valid_targets_mean": 1739.5,
"valid_targets_min": 1462
},
{
"epoch": 3.437932437932438,
"grad_norm": 0.7197452670352181,
"learning_rate": 2.4093645913256855e-05,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06945577263832092,
"step": 4225,
"valid_targets_mean": 1475.9,
"valid_targets_min": 944
},
{
"epoch": 3.442002442002442,
"grad_norm": 0.7090142042404015,
"learning_rate": 2.405391805838322e-05,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07137700915336609,
"step": 4230,
"valid_targets_mean": 1482.6,
"valid_targets_min": 1227
},
{
"epoch": 3.446072446072446,
"grad_norm": 0.7513863866998308,
"learning_rate": 2.401417351535795e-05,
"loss": 0.1573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06505010277032852,
"step": 4235,
"valid_targets_mean": 1276.5,
"valid_targets_min": 740
},
{
"epoch": 3.45014245014245,
"grad_norm": 0.7487725404958699,
"learning_rate": 2.3974412447791403e-05,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09261137992143631,
"step": 4240,
"valid_targets_mean": 2024.8,
"valid_targets_min": 881
},
{
"epoch": 3.4542124542124544,
"grad_norm": 0.8187666821446936,
"learning_rate": 2.3934635019361955e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08315032720565796,
"step": 4245,
"valid_targets_mean": 1288.6,
"valid_targets_min": 636
},
{
"epoch": 3.4582824582824583,
"grad_norm": 0.753634047230146,
"learning_rate": 2.3894841393815323e-05,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055352650582790375,
"step": 4250,
"valid_targets_mean": 1103.9,
"valid_targets_min": 814
},
{
"epoch": 3.462352462352462,
"grad_norm": 0.8079463943992531,
"learning_rate": 2.3855031734963925e-05,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07735898345708847,
"step": 4255,
"valid_targets_mean": 1392.9,
"valid_targets_min": 820
},
{
"epoch": 3.4664224664224665,
"grad_norm": 0.7707769218886613,
"learning_rate": 2.3815206206686144e-05,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06932565569877625,
"step": 4260,
"valid_targets_mean": 1392.4,
"valid_targets_min": 661
},
{
"epoch": 3.4704924704924704,
"grad_norm": 0.7958744117773525,
"learning_rate": 2.3775364972925737e-05,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07428084313869476,
"step": 4265,
"valid_targets_mean": 1441.8,
"valid_targets_min": 728
},
{
"epoch": 3.4745624745624744,
"grad_norm": 0.7647293162181219,
"learning_rate": 2.3735508197691068e-05,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07184837758541107,
"step": 4270,
"valid_targets_mean": 1413.5,
"valid_targets_min": 692
},
{
"epoch": 3.4786324786324787,
"grad_norm": 0.760684869364684,
"learning_rate": 2.369563604505451e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07639266550540924,
"step": 4275,
"valid_targets_mean": 1323.5,
"valid_targets_min": 840
},
{
"epoch": 3.4827024827024826,
"grad_norm": 0.785131473550303,
"learning_rate": 2.365574867915172e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07727733254432678,
"step": 4280,
"valid_targets_mean": 1488.4,
"valid_targets_min": 950
},
{
"epoch": 3.4867724867724865,
"grad_norm": 0.712055390091951,
"learning_rate": 2.361584626418099e-05,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08490264415740967,
"step": 4285,
"valid_targets_mean": 1935.9,
"valid_targets_min": 878
},
{
"epoch": 3.490842490842491,
"grad_norm": 0.8293965286613701,
"learning_rate": 2.3575928964402558e-05,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08114030957221985,
"step": 4290,
"valid_targets_mean": 1502.1,
"valid_targets_min": 836
},
{
"epoch": 3.494912494912495,
"grad_norm": 0.7983467061857048,
"learning_rate": 2.353599694413794e-05,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08377361297607422,
"step": 4295,
"valid_targets_mean": 1535.1,
"valid_targets_min": 1013
},
{
"epoch": 3.498982498982499,
"grad_norm": 0.7795845542928671,
"learning_rate": 2.349605036776925e-05,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06817035377025604,
"step": 4300,
"valid_targets_mean": 1346.4,
"valid_targets_min": 748
},
{
"epoch": 3.503052503052503,
"grad_norm": 0.9206942614110478,
"learning_rate": 2.3456089399738514e-05,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.079506516456604,
"step": 4305,
"valid_targets_mean": 1543.9,
"valid_targets_min": 729
},
{
"epoch": 3.5071225071225074,
"grad_norm": 0.7302785723268027,
"learning_rate": 2.3416114204547e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07028716802597046,
"step": 4310,
"valid_targets_mean": 1541.9,
"valid_targets_min": 1219
},
{
"epoch": 3.5111925111925113,
"grad_norm": 0.7112489536142887,
"learning_rate": 2.3376124946754574e-05,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07776269316673279,
"step": 4315,
"valid_targets_mean": 1632.8,
"valid_targets_min": 916
},
{
"epoch": 3.515262515262515,
"grad_norm": 0.7261049103300148,
"learning_rate": 2.3336121790978955e-05,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06957513093948364,
"step": 4320,
"valid_targets_mean": 1349.9,
"valid_targets_min": 646
},
{
"epoch": 3.5193325193325196,
"grad_norm": 0.7903987711410705,
"learning_rate": 2.3296104901895074e-05,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08000437915325165,
"step": 4325,
"valid_targets_mean": 1383.0,
"valid_targets_min": 906
},
{
"epoch": 3.5234025234025235,
"grad_norm": 0.7622357569514845,
"learning_rate": 2.3256074444234437e-05,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07310856133699417,
"step": 4330,
"valid_targets_mean": 1577.5,
"valid_targets_min": 848
},
{
"epoch": 3.5274725274725274,
"grad_norm": 0.8743060398490866,
"learning_rate": 2.3216030582784358e-05,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07247571647167206,
"step": 4335,
"valid_targets_mean": 1183.5,
"valid_targets_min": 692
},
{
"epoch": 3.5315425315425317,
"grad_norm": 0.7953087241662045,
"learning_rate": 2.317597348238735e-05,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06898859143257141,
"step": 4340,
"valid_targets_mean": 1373.9,
"valid_targets_min": 821
},
{
"epoch": 3.5356125356125356,
"grad_norm": 0.7438998227523352,
"learning_rate": 2.3135903307940425e-05,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06783884018659592,
"step": 4345,
"valid_targets_mean": 1428.1,
"valid_targets_min": 1013
},
{
"epoch": 3.5396825396825395,
"grad_norm": 0.7403466593709432,
"learning_rate": 2.3095820224394418e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06895196437835693,
"step": 4350,
"valid_targets_mean": 1420.9,
"valid_targets_min": 781
},
{
"epoch": 3.543752543752544,
"grad_norm": 0.7776344239197351,
"learning_rate": 2.305572439675329e-05,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08171670138835907,
"step": 4355,
"valid_targets_mean": 1255.1,
"valid_targets_min": 548
},
{
"epoch": 3.547822547822548,
"grad_norm": 0.7334294368492669,
"learning_rate": 2.3015615990073483e-05,
"loss": 0.1475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0776100903749466,
"step": 4360,
"valid_targets_mean": 1411.0,
"valid_targets_min": 694
},
{
"epoch": 3.5518925518925517,
"grad_norm": 0.7080206142881729,
"learning_rate": 2.29754951694632e-05,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0899009108543396,
"step": 4365,
"valid_targets_mean": 1973.8,
"valid_targets_min": 1030
},
{
"epoch": 3.555962555962556,
"grad_norm": 0.6615510612620584,
"learning_rate": 2.2935362100081767e-05,
"loss": 0.1414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.061547666788101196,
"step": 4370,
"valid_targets_mean": 1580.2,
"valid_targets_min": 682
},
{
"epoch": 3.56003256003256,
"grad_norm": 0.81839532426026,
"learning_rate": 2.2895216947138924e-05,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07387113571166992,
"step": 4375,
"valid_targets_mean": 1425.4,
"valid_targets_min": 990
},
{
"epoch": 3.564102564102564,
"grad_norm": 0.7054362018903443,
"learning_rate": 2.285505987589415e-05,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055615417659282684,
"step": 4380,
"valid_targets_mean": 1299.6,
"valid_targets_min": 639
},
{
"epoch": 3.5681725681725682,
"grad_norm": 0.8007028427332834,
"learning_rate": 2.281489105165599e-05,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0648592859506607,
"step": 4385,
"valid_targets_mean": 1458.8,
"valid_targets_min": 721
},
{
"epoch": 3.572242572242572,
"grad_norm": 0.8445299441357773,
"learning_rate": 2.277471063978137e-05,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07231980562210083,
"step": 4390,
"valid_targets_mean": 1329.8,
"valid_targets_min": 874
},
{
"epoch": 3.576312576312576,
"grad_norm": 0.6807816095455992,
"learning_rate": 2.2734518805674913e-05,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07544272392988205,
"step": 4395,
"valid_targets_mean": 1559.9,
"valid_targets_min": 686
},
{
"epoch": 3.5803825803825804,
"grad_norm": 0.8452163681063782,
"learning_rate": 2.269431571478828e-05,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08027100563049316,
"step": 4400,
"valid_targets_mean": 1392.5,
"valid_targets_min": 713
},
{
"epoch": 3.5844525844525843,
"grad_norm": 0.7806355035255146,
"learning_rate": 2.2654101532619443e-05,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06163328140974045,
"step": 4405,
"valid_targets_mean": 1209.0,
"valid_targets_min": 393
},
{
"epoch": 3.5885225885225887,
"grad_norm": 0.48984256846528007,
"learning_rate": 2.2613876424712052e-05,
"loss": 0.1305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04831802099943161,
"step": 4410,
"valid_targets_mean": 2470.8,
"valid_targets_min": 816
},
{
"epoch": 3.5925925925925926,
"grad_norm": 0.39618952222130516,
"learning_rate": 2.257364055665473e-05,
"loss": 0.0913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04768257588148117,
"step": 4415,
"valid_targets_mean": 3278.9,
"valid_targets_min": 2461
},
{
"epoch": 3.596662596662597,
"grad_norm": 0.39078618847965113,
"learning_rate": 2.2533394094080397e-05,
"loss": 0.0877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048612505197525024,
"step": 4420,
"valid_targets_mean": 3783.6,
"valid_targets_min": 2571
},
{
"epoch": 3.600732600732601,
"grad_norm": 0.3479538454031919,
"learning_rate": 2.2493137202665566e-05,
"loss": 0.1058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046523869037628174,
"step": 4425,
"valid_targets_mean": 3905.0,
"valid_targets_min": 3179
},
{
"epoch": 3.6048026048026047,
"grad_norm": 0.40917149997042873,
"learning_rate": 2.2452870048129707e-05,
"loss": 0.0847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038769036531448364,
"step": 4430,
"valid_targets_mean": 3000.1,
"valid_targets_min": 943
},
{
"epoch": 3.608872608872609,
"grad_norm": 0.7387439093745595,
"learning_rate": 2.241259279623453e-05,
"loss": 0.1063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06168878823518753,
"step": 4435,
"valid_targets_mean": 974.8,
"valid_targets_min": 525
},
{
"epoch": 3.612942612942613,
"grad_norm": 0.43905368150585783,
"learning_rate": 2.2372305612783305e-05,
"loss": 0.1354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04938036948442459,
"step": 4440,
"valid_targets_mean": 2743.8,
"valid_targets_min": 954
},
{
"epoch": 3.617012617012617,
"grad_norm": 0.4689396969033086,
"learning_rate": 2.233200866362019e-05,
"loss": 0.094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060613177716732025,
"step": 4445,
"valid_targets_mean": 2744.4,
"valid_targets_min": 718
},
{
"epoch": 3.6210826210826212,
"grad_norm": 0.3460122217852074,
"learning_rate": 2.2291702114629542e-05,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0620415098965168,
"step": 4450,
"valid_targets_mean": 3279.1,
"valid_targets_min": 540
},
{
"epoch": 3.625152625152625,
"grad_norm": 0.2918413867985773,
"learning_rate": 2.225138613173524e-05,
"loss": 0.1076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033721111714839935,
"step": 4455,
"valid_targets_mean": 4515.5,
"valid_targets_min": 1008
},
{
"epoch": 3.629222629222629,
"grad_norm": 0.3411037126787543,
"learning_rate": 2.2211060880899996e-05,
"loss": 0.0876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04788324981927872,
"step": 4460,
"valid_targets_mean": 3701.6,
"valid_targets_min": 818
},
{
"epoch": 3.6332926332926334,
"grad_norm": 0.29653848428471286,
"learning_rate": 2.217072652812468e-05,
"loss": 0.0905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036281127482652664,
"step": 4465,
"valid_targets_mean": 3858.5,
"valid_targets_min": 1006
},
{
"epoch": 3.6373626373626373,
"grad_norm": 0.5325825065869296,
"learning_rate": 2.213038323944761e-05,
"loss": 0.1021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0998295247554779,
"step": 4470,
"valid_targets_mean": 2629.8,
"valid_targets_min": 614
},
{
"epoch": 3.6414326414326412,
"grad_norm": 0.37544688292236766,
"learning_rate": 2.209003118094392e-05,
"loss": 0.1219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03794893994927406,
"step": 4475,
"valid_targets_mean": 3368.0,
"valid_targets_min": 1997
},
{
"epoch": 3.6455026455026456,
"grad_norm": 0.5425961999646625,
"learning_rate": 2.2049670518724818e-05,
"loss": 0.0897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04944489151239395,
"step": 4480,
"valid_targets_mean": 1644.2,
"valid_targets_min": 674
},
{
"epoch": 3.6495726495726495,
"grad_norm": 0.31434891274177323,
"learning_rate": 2.2009301418936945e-05,
"loss": 0.0828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038889069110155106,
"step": 4485,
"valid_targets_mean": 3700.4,
"valid_targets_min": 989
},
{
"epoch": 3.6536426536426534,
"grad_norm": 0.3810739437224756,
"learning_rate": 2.1968924047761665e-05,
"loss": 0.0787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03368036821484566,
"step": 4490,
"valid_targets_mean": 3537.8,
"valid_targets_min": 2616
},
{
"epoch": 3.6577126577126577,
"grad_norm": 0.43609678797054763,
"learning_rate": 2.1928538571414416e-05,
"loss": 0.1085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05374626815319061,
"step": 4495,
"valid_targets_mean": 2184.5,
"valid_targets_min": 714
},
{
"epoch": 3.6617826617826617,
"grad_norm": 0.4437529891094936,
"learning_rate": 2.1888145156143966e-05,
"loss": 0.0984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05205199122428894,
"step": 4500,
"valid_targets_mean": 2054.5,
"valid_targets_min": 893
},
{
"epoch": 3.665852665852666,
"grad_norm": 0.43380985224197094,
"learning_rate": 2.184774396823178e-05,
"loss": 0.1051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0552193820476532,
"step": 4505,
"valid_targets_mean": 3681.5,
"valid_targets_min": 2353
},
{
"epoch": 3.66992266992267,
"grad_norm": 0.3799243340192024,
"learning_rate": 2.180733517399133e-05,
"loss": 0.0995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049977511167526245,
"step": 4510,
"valid_targets_mean": 3436.9,
"valid_targets_min": 1810
},
{
"epoch": 3.6739926739926743,
"grad_norm": 0.32571580848557247,
"learning_rate": 2.1766918939767394e-05,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036109715700149536,
"step": 4515,
"valid_targets_mean": 3740.8,
"valid_targets_min": 1955
},
{
"epoch": 3.678062678062678,
"grad_norm": 0.39033800490114573,
"learning_rate": 2.1726495431935364e-05,
"loss": 0.0864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04185417294502258,
"step": 4520,
"valid_targets_mean": 3092.0,
"valid_targets_min": 711
},
{
"epoch": 3.682132682132682,
"grad_norm": 0.6397111709341369,
"learning_rate": 2.1686064816900587e-05,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07134007662534714,
"step": 4525,
"valid_targets_mean": 1687.1,
"valid_targets_min": 643
},
{
"epoch": 3.6862026862026864,
"grad_norm": 0.5232501844782532,
"learning_rate": 2.164562726109766e-05,
"loss": 0.1125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04346204549074173,
"step": 4530,
"valid_targets_mean": 2173.0,
"valid_targets_min": 538
},
{
"epoch": 3.6902726902726903,
"grad_norm": 0.39995472780169194,
"learning_rate": 2.1605182930989764e-05,
"loss": 0.0916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03484119474887848,
"step": 4535,
"valid_targets_mean": 1954.0,
"valid_targets_min": 664
},
{
"epoch": 3.6943426943426942,
"grad_norm": 0.5523582831008328,
"learning_rate": 2.1564731993067958e-05,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10305885225534439,
"step": 4540,
"valid_targets_mean": 2692.1,
"valid_targets_min": 1180
},
{
"epoch": 3.6984126984126986,
"grad_norm": 0.43560416380796335,
"learning_rate": 2.1524274613850495e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039621271193027496,
"step": 4545,
"valid_targets_mean": 2071.0,
"valid_targets_min": 756
},
{
"epoch": 3.7024827024827025,
"grad_norm": 0.35770234003575513,
"learning_rate": 2.1483810959882154e-05,
"loss": 0.1031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04059296101331711,
"step": 4550,
"valid_targets_mean": 3086.0,
"valid_targets_min": 844
},
{
"epoch": 3.7065527065527064,
"grad_norm": 0.6970042913323712,
"learning_rate": 2.144334119773355e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12542730569839478,
"step": 4555,
"valid_targets_mean": 2081.2,
"valid_targets_min": 1146
},
{
"epoch": 3.7106227106227108,
"grad_norm": 0.31025486801351915,
"learning_rate": 2.1402865494000435e-05,
"loss": 0.1039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0449528843164444,
"step": 4560,
"valid_targets_mean": 4426.4,
"valid_targets_min": 3507
},
{
"epoch": 3.7146927146927147,
"grad_norm": 0.3347224349640861,
"learning_rate": 2.1362384015303002e-05,
"loss": 0.0879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04645727574825287,
"step": 4565,
"valid_targets_mean": 4391.1,
"valid_targets_min": 3483
},
{
"epoch": 3.7187627187627186,
"grad_norm": 0.37334581619913065,
"learning_rate": 2.1321896928285256e-05,
"loss": 0.1023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048772167414426804,
"step": 4570,
"valid_targets_mean": 3939.6,
"valid_targets_min": 784
},
{
"epoch": 3.722832722832723,
"grad_norm": 0.4447642934119185,
"learning_rate": 2.128140439961426e-05,
"loss": 0.0878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033333856612443924,
"step": 4575,
"valid_targets_mean": 1469.4,
"valid_targets_min": 779
},
{
"epoch": 3.726902726902727,
"grad_norm": 0.5372359551407455,
"learning_rate": 2.1240906595979488e-05,
"loss": 0.0905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039604753255844116,
"step": 4580,
"valid_targets_mean": 1845.1,
"valid_targets_min": 674
},
{
"epoch": 3.7309727309727307,
"grad_norm": 0.4637069162414348,
"learning_rate": 2.1200403684092112e-05,
"loss": 0.0839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04348008334636688,
"step": 4585,
"valid_targets_mean": 2154.5,
"valid_targets_min": 712
},
{
"epoch": 3.735042735042735,
"grad_norm": 0.49301713165155914,
"learning_rate": 2.115989583068436e-05,
"loss": 0.0904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04291559010744095,
"step": 4590,
"valid_targets_mean": 3409.4,
"valid_targets_min": 2422
},
{
"epoch": 3.739112739112739,
"grad_norm": 0.34908985580550017,
"learning_rate": 2.1119383202508793e-05,
"loss": 0.0769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026736728847026825,
"step": 4595,
"valid_targets_mean": 2888.1,
"valid_targets_min": 576
},
{
"epoch": 3.743182743182743,
"grad_norm": 0.3051490004834012,
"learning_rate": 2.107886596633761e-05,
"loss": 0.1341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022518891841173172,
"step": 4600,
"valid_targets_mean": 3605.9,
"valid_targets_min": 772
},
{
"epoch": 3.7472527472527473,
"grad_norm": 0.39215842357161595,
"learning_rate": 2.1038344288961995e-05,
"loss": 0.0736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03927973657846451,
"step": 4605,
"valid_targets_mean": 2694.1,
"valid_targets_min": 722
},
{
"epoch": 3.751322751322751,
"grad_norm": 0.3416371707837828,
"learning_rate": 2.099781833719142e-05,
"loss": 0.0758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04170195013284683,
"step": 4610,
"valid_targets_mean": 3837.2,
"valid_targets_min": 2788
},
{
"epoch": 3.7553927553927555,
"grad_norm": 0.3686746265338282,
"learning_rate": 2.095728827785294e-05,
"loss": 0.0796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03984172269701958,
"step": 4615,
"valid_targets_mean": 2829.4,
"valid_targets_min": 614
},
{
"epoch": 3.7594627594627594,
"grad_norm": 0.6031062567308154,
"learning_rate": 2.091675427779052e-05,
"loss": 0.1129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.125014990568161,
"step": 4620,
"valid_targets_mean": 1989.6,
"valid_targets_min": 608
},
{
"epoch": 3.763532763532764,
"grad_norm": 0.34464040068494,
"learning_rate": 2.0876216503864348e-05,
"loss": 0.0963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03857950493693352,
"step": 4625,
"valid_targets_mean": 3851.4,
"valid_targets_min": 3150
},
{
"epoch": 3.7676027676027677,
"grad_norm": 0.521731284937972,
"learning_rate": 2.0835675122950155e-05,
"loss": 0.1206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0498424731194973,
"step": 4630,
"valid_targets_mean": 2037.9,
"valid_targets_min": 718
},
{
"epoch": 3.7716727716727716,
"grad_norm": 0.6148462798244299,
"learning_rate": 2.079513030193852e-05,
"loss": 0.0937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04556414484977722,
"step": 4635,
"valid_targets_mean": 3679.2,
"valid_targets_min": 1333
},
{
"epoch": 3.775742775742776,
"grad_norm": 0.4489274468020415,
"learning_rate": 2.0754582207734163e-05,
"loss": 0.1115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0359991192817688,
"step": 4640,
"valid_targets_mean": 1756.9,
"valid_targets_min": 693
},
{
"epoch": 3.77981277981278,
"grad_norm": 0.4685040453171337,
"learning_rate": 2.0714031007255308e-05,
"loss": 0.1217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039639245718717575,
"step": 4645,
"valid_targets_mean": 1352.6,
"valid_targets_min": 803
},
{
"epoch": 3.7838827838827838,
"grad_norm": 0.38901622311150574,
"learning_rate": 2.0673476867432945e-05,
"loss": 0.0985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07358896732330322,
"step": 4650,
"valid_targets_mean": 2522.5,
"valid_targets_min": 902
},
{
"epoch": 3.787952787952788,
"grad_norm": 0.45401232368813943,
"learning_rate": 2.0632919955210177e-05,
"loss": 0.1103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044406771659851074,
"step": 4655,
"valid_targets_mean": 3511.5,
"valid_targets_min": 2393
},
{
"epoch": 3.792022792022792,
"grad_norm": 0.33635740471339176,
"learning_rate": 2.0592360437541506e-05,
"loss": 0.0954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03269575536251068,
"step": 4660,
"valid_targets_mean": 3454.1,
"valid_targets_min": 804
},
{
"epoch": 3.796092796092796,
"grad_norm": 0.3694812668687151,
"learning_rate": 2.055179848139217e-05,
"loss": 0.0927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04042567312717438,
"step": 4665,
"valid_targets_mean": 5271.5,
"valid_targets_min": 4147
},
{
"epoch": 3.8001628001628003,
"grad_norm": 0.3719991625867249,
"learning_rate": 2.0511234253737445e-05,
"loss": 0.081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04839537665247917,
"step": 4670,
"valid_targets_mean": 4163.8,
"valid_targets_min": 871
},
{
"epoch": 3.804232804232804,
"grad_norm": 0.38045962863863597,
"learning_rate": 2.047066792156195e-05,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027333011850714684,
"step": 4675,
"valid_targets_mean": 4198.2,
"valid_targets_min": 896
},
{
"epoch": 3.808302808302808,
"grad_norm": 0.34894815665055257,
"learning_rate": 2.0430099651858972e-05,
"loss": 0.0897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046752214431762695,
"step": 4680,
"valid_targets_mean": 3781.4,
"valid_targets_min": 2862
},
{
"epoch": 3.8123728123728124,
"grad_norm": 0.6275665055735403,
"learning_rate": 2.038952961162978e-05,
"loss": 0.109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06374616920948029,
"step": 4685,
"valid_targets_mean": 1718.8,
"valid_targets_min": 497
},
{
"epoch": 3.8164428164428164,
"grad_norm": 0.40826142469048216,
"learning_rate": 2.034895796788292e-05,
"loss": 0.0907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05431363359093666,
"step": 4690,
"valid_targets_mean": 4016.9,
"valid_targets_min": 3217
},
{
"epoch": 3.8205128205128203,
"grad_norm": 0.4250331729338565,
"learning_rate": 2.030838488763355e-05,
"loss": 0.1007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03880765289068222,
"step": 4695,
"valid_targets_mean": 2624.6,
"valid_targets_min": 901
},
{
"epoch": 3.8245828245828246,
"grad_norm": 0.39072073946366787,
"learning_rate": 2.0267810537902727e-05,
"loss": 0.0771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04679608345031738,
"step": 4700,
"valid_targets_mean": 3859.0,
"valid_targets_min": 2425
},
{
"epoch": 3.8286528286528285,
"grad_norm": 0.3928920752567127,
"learning_rate": 2.0227235085716754e-05,
"loss": 0.0994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06546978652477264,
"step": 4705,
"valid_targets_mean": 3524.6,
"valid_targets_min": 3017
},
{
"epoch": 3.832722832722833,
"grad_norm": 0.37248107631418687,
"learning_rate": 2.0186658698106445e-05,
"loss": 0.0862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036713846027851105,
"step": 4710,
"valid_targets_mean": 3727.2,
"valid_targets_min": 3184
},
{
"epoch": 3.836792836792837,
"grad_norm": 0.6173637983811905,
"learning_rate": 2.0146081542106502e-05,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0795275866985321,
"step": 4715,
"valid_targets_mean": 2059.5,
"valid_targets_min": 478
},
{
"epoch": 3.840862840862841,
"grad_norm": 0.506439817469206,
"learning_rate": 2.010550378475475e-05,
"loss": 0.0888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050123006105422974,
"step": 4720,
"valid_targets_mean": 1881.8,
"valid_targets_min": 955
},
{
"epoch": 3.844932844932845,
"grad_norm": 0.5407218171773867,
"learning_rate": 2.006492559309152e-05,
"loss": 0.095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0604960098862648,
"step": 4725,
"valid_targets_mean": 1654.2,
"valid_targets_min": 959
},
{
"epoch": 3.849002849002849,
"grad_norm": 0.3651902043497858,
"learning_rate": 2.0024347134158915e-05,
"loss": 0.0999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03338472917675972,
"step": 4730,
"valid_targets_mean": 2815.5,
"valid_targets_min": 748
},
{
"epoch": 3.8530728530728533,
"grad_norm": 0.4855059874008844,
"learning_rate": 1.9983768575000147e-05,
"loss": 0.0909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03731710463762283,
"step": 4735,
"valid_targets_mean": 1247.0,
"valid_targets_min": 495
},
{
"epoch": 3.857142857142857,
"grad_norm": 0.47569854814679674,
"learning_rate": 1.9943190082658827e-05,
"loss": 0.1019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031180473044514656,
"step": 4740,
"valid_targets_mean": 2142.4,
"valid_targets_min": 655
},
{
"epoch": 3.861212861212861,
"grad_norm": 0.6078700792608549,
"learning_rate": 1.9902611824178306e-05,
"loss": 0.1117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.088534876704216,
"step": 4745,
"valid_targets_mean": 2176.2,
"valid_targets_min": 521
},
{
"epoch": 3.8652828652828655,
"grad_norm": 0.3966917197512265,
"learning_rate": 1.986203396660097e-05,
"loss": 0.0864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04920294135808945,
"step": 4750,
"valid_targets_mean": 3740.4,
"valid_targets_min": 2788
},
{
"epoch": 3.8693528693528694,
"grad_norm": 0.3078969308089153,
"learning_rate": 1.9821456676967552e-05,
"loss": 0.0758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03821399807929993,
"step": 4755,
"valid_targets_mean": 3481.5,
"valid_targets_min": 841
},
{
"epoch": 3.8734228734228733,
"grad_norm": 0.41592065293330216,
"learning_rate": 1.9780880122316434e-05,
"loss": 0.0881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04670462757349014,
"step": 4760,
"valid_targets_mean": 2820.0,
"valid_targets_min": 2144
},
{
"epoch": 3.8774928774928776,
"grad_norm": 0.42102684627161313,
"learning_rate": 1.9740304469682987e-05,
"loss": 0.1147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05189353972673416,
"step": 4765,
"valid_targets_mean": 3554.1,
"valid_targets_min": 2619
},
{
"epoch": 3.8815628815628815,
"grad_norm": 0.3289199750652924,
"learning_rate": 1.9699729886098876e-05,
"loss": 0.0714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03820990025997162,
"step": 4770,
"valid_targets_mean": 3334.5,
"valid_targets_min": 619
},
{
"epoch": 3.8856328856328854,
"grad_norm": 0.3257554126268986,
"learning_rate": 1.965915653859135e-05,
"loss": 0.0887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038173578679561615,
"step": 4775,
"valid_targets_mean": 4034.9,
"valid_targets_min": 486
},
{
"epoch": 3.88970288970289,
"grad_norm": 0.31496384696830865,
"learning_rate": 1.9618584594182576e-05,
"loss": 0.0871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040112294256687164,
"step": 4780,
"valid_targets_mean": 3456.8,
"valid_targets_min": 995
},
{
"epoch": 3.8937728937728937,
"grad_norm": 0.3078455051176223,
"learning_rate": 1.957801421988894e-05,
"loss": 0.0722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047052159905433655,
"step": 4785,
"valid_targets_mean": 4773.8,
"valid_targets_min": 3539
},
{
"epoch": 3.8978428978428976,
"grad_norm": 0.3723134741147702,
"learning_rate": 1.9537445582720385e-05,
"loss": 0.0946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05127771943807602,
"step": 4790,
"valid_targets_mean": 4328.5,
"valid_targets_min": 3172
},
{
"epoch": 3.901912901912902,
"grad_norm": 0.306985867833895,
"learning_rate": 1.9496878849679667e-05,
"loss": 0.0781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02703310176730156,
"step": 4795,
"valid_targets_mean": 2120.1,
"valid_targets_min": 549
},
{
"epoch": 3.905982905982906,
"grad_norm": 0.3994634886270254,
"learning_rate": 1.9456314187761726e-05,
"loss": 0.1164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053539011627435684,
"step": 4800,
"valid_targets_mean": 2216.2,
"valid_targets_min": 541
},
{
"epoch": 3.91005291005291,
"grad_norm": 0.3309405585861779,
"learning_rate": 1.941575176395298e-05,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029777104035019875,
"step": 4805,
"valid_targets_mean": 3338.9,
"valid_targets_min": 1938
},
{
"epoch": 3.914122914122914,
"grad_norm": 0.4467641072962703,
"learning_rate": 1.937519174523063e-05,
"loss": 0.0891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12722966074943542,
"step": 4810,
"valid_targets_mean": 2226.6,
"valid_targets_min": 1167
},
{
"epoch": 3.918192918192918,
"grad_norm": 0.390118295374521,
"learning_rate": 1.9334634298561962e-05,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043785303831100464,
"step": 4815,
"valid_targets_mean": 3561.4,
"valid_targets_min": 2919
},
{
"epoch": 3.9222629222629224,
"grad_norm": 0.40458656901794954,
"learning_rate": 1.9294079590903697e-05,
"loss": 0.086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03705420717597008,
"step": 4820,
"valid_targets_mean": 1509.9,
"valid_targets_min": 559
},
{
"epoch": 3.9263329263329263,
"grad_norm": 0.525559021088802,
"learning_rate": 1.925352778920126e-05,
"loss": 0.09,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06773480027914047,
"step": 4825,
"valid_targets_mean": 3123.1,
"valid_targets_min": 883
},
{
"epoch": 3.9304029304029307,
"grad_norm": 0.7659028123265849,
"learning_rate": 1.9212979060388136e-05,
"loss": 0.1144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07741884142160416,
"step": 4830,
"valid_targets_mean": 1419.0,
"valid_targets_min": 337
},
{
"epoch": 3.9344729344729346,
"grad_norm": 0.37012249374521133,
"learning_rate": 1.917243357138514e-05,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03321508690714836,
"step": 4835,
"valid_targets_mean": 2953.9,
"valid_targets_min": 593
},
{
"epoch": 3.9385429385429385,
"grad_norm": 0.38243163663291685,
"learning_rate": 1.9131891489099745e-05,
"loss": 0.0949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04113879054784775,
"step": 4840,
"valid_targets_mean": 3091.9,
"valid_targets_min": 529
},
{
"epoch": 3.942612942612943,
"grad_norm": 0.4160846401676222,
"learning_rate": 1.9091352980425427e-05,
"loss": 0.0951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05502070114016533,
"step": 4845,
"valid_targets_mean": 3593.4,
"valid_targets_min": 2556
},
{
"epoch": 3.9466829466829467,
"grad_norm": 0.44382246740561504,
"learning_rate": 1.9050818212240937e-05,
"loss": 0.0843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05704183131456375,
"step": 4850,
"valid_targets_mean": 3753.2,
"valid_targets_min": 3385
},
{
"epoch": 3.9507529507529506,
"grad_norm": 0.3788947152767503,
"learning_rate": 1.9010287351409617e-05,
"loss": 0.0822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03963714465498924,
"step": 4855,
"valid_targets_mean": 3442.1,
"valid_targets_min": 932
},
{
"epoch": 3.954822954822955,
"grad_norm": 0.6893550041691463,
"learning_rate": 1.896976056477874e-05,
"loss": 0.0852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05745682120323181,
"step": 4860,
"valid_targets_mean": 1202.9,
"valid_targets_min": 598
},
{
"epoch": 3.958892958892959,
"grad_norm": 0.48501252893743335,
"learning_rate": 1.892923801917881e-05,
"loss": 0.0978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04939830303192139,
"step": 4865,
"valid_targets_mean": 3333.5,
"valid_targets_min": 1069
},
{
"epoch": 3.962962962962963,
"grad_norm": 1.5705058397396339,
"learning_rate": 1.888871988142285e-05,
"loss": 0.0818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036230284720659256,
"step": 4870,
"valid_targets_mean": 1234.5,
"valid_targets_min": 680
},
{
"epoch": 3.967032967032967,
"grad_norm": 0.38273222211564595,
"learning_rate": 1.8848206318305762e-05,
"loss": 0.0806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038350578397512436,
"step": 4875,
"valid_targets_mean": 2762.4,
"valid_targets_min": 774
},
{
"epoch": 3.971102971102971,
"grad_norm": 0.3525402431797138,
"learning_rate": 1.8807697496603604e-05,
"loss": 0.0942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04092249274253845,
"step": 4880,
"valid_targets_mean": 3842.5,
"valid_targets_min": 720
},
{
"epoch": 3.975172975172975,
"grad_norm": 0.23643952371340574,
"learning_rate": 1.8767193583072917e-05,
"loss": 0.0754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03318733721971512,
"step": 4885,
"valid_targets_mean": 5590.6,
"valid_targets_min": 4657
},
{
"epoch": 3.9792429792429793,
"grad_norm": 0.34030143973987964,
"learning_rate": 1.8726694744450046e-05,
"loss": 0.081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04707394912838936,
"step": 4890,
"valid_targets_mean": 4327.4,
"valid_targets_min": 1320
},
{
"epoch": 3.9833129833129832,
"grad_norm": 0.3472447381234327,
"learning_rate": 1.868620114745043e-05,
"loss": 0.0863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04898809269070625,
"step": 4895,
"valid_targets_mean": 3547.8,
"valid_targets_min": 2463
},
{
"epoch": 3.987382987382987,
"grad_norm": 0.416132959419297,
"learning_rate": 1.8645712958767936e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031941697001457214,
"step": 4900,
"valid_targets_mean": 2903.5,
"valid_targets_min": 605
},
{
"epoch": 3.9914529914529915,
"grad_norm": 0.33752542112182116,
"learning_rate": 1.8605230345074187e-05,
"loss": 0.0793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035623304545879364,
"step": 4905,
"valid_targets_mean": 3095.8,
"valid_targets_min": 1014
},
{
"epoch": 3.9955229955229954,
"grad_norm": 0.35702567633782445,
"learning_rate": 1.8564753473017815e-05,
"loss": 0.0926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04029485583305359,
"step": 4910,
"valid_targets_mean": 3526.4,
"valid_targets_min": 2807
},
{
"epoch": 3.9995929995929997,
"grad_norm": 0.4652040750909582,
"learning_rate": 1.8524282509223857e-05,
"loss": 0.1126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09600470215082169,
"step": 4915,
"valid_targets_mean": 3006.5,
"valid_targets_min": 1214
},
{
"epoch": 4.003256003256003,
"grad_norm": 0.6419873740137033,
"learning_rate": 1.8483817620293002e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15491032600402832,
"step": 4920,
"valid_targets_mean": 8029.9,
"valid_targets_min": 6142
},
{
"epoch": 4.007326007326007,
"grad_norm": 0.4261293015569112,
"learning_rate": 1.8443358972800943e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09373286366462708,
"step": 4925,
"valid_targets_mean": 6664.0,
"valid_targets_min": 5470
},
{
"epoch": 4.011396011396012,
"grad_norm": 0.43569183179763055,
"learning_rate": 1.8402906733297686e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09796077013015747,
"step": 4930,
"valid_targets_mean": 7126.9,
"valid_targets_min": 5368
},
{
"epoch": 4.015466015466015,
"grad_norm": 0.3628222940332491,
"learning_rate": 1.836246106830684e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08767811954021454,
"step": 4935,
"valid_targets_mean": 7634.9,
"valid_targets_min": 5614
},
{
"epoch": 4.0195360195360195,
"grad_norm": 0.41186264281524637,
"learning_rate": 1.832202214432497e-05,
"loss": 0.1851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08911505341529846,
"step": 4940,
"valid_targets_mean": 8630.8,
"valid_targets_min": 6362
},
{
"epoch": 4.023606023606024,
"grad_norm": 0.39527021624678743,
"learning_rate": 1.828159012782087e-05,
"loss": 0.1879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09319797903299332,
"step": 4945,
"valid_targets_mean": 7383.6,
"valid_targets_min": 5844
},
{
"epoch": 4.027676027676027,
"grad_norm": 0.3825769189458071,
"learning_rate": 1.824116518523492e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1047782227396965,
"step": 4950,
"valid_targets_mean": 8017.0,
"valid_targets_min": 5283
},
{
"epoch": 4.031746031746032,
"grad_norm": 0.37851649415828814,
"learning_rate": 1.8200747482978358e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07832890748977661,
"step": 4955,
"valid_targets_mean": 7051.1,
"valid_targets_min": 4135
},
{
"epoch": 4.035816035816036,
"grad_norm": 0.3899190146807035,
"learning_rate": 1.8160337187432637e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07594281435012817,
"step": 4960,
"valid_targets_mean": 5370.4,
"valid_targets_min": 3919
},
{
"epoch": 4.0398860398860394,
"grad_norm": 0.3710326532028934,
"learning_rate": 1.8119934464948713e-05,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07691587507724762,
"step": 4965,
"valid_targets_mean": 6063.6,
"valid_targets_min": 4863
},
{
"epoch": 4.043956043956044,
"grad_norm": 0.425559143325838,
"learning_rate": 1.8079539481846366e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08631320297718048,
"step": 4970,
"valid_targets_mean": 7001.2,
"valid_targets_min": 6020
},
{
"epoch": 4.048026048026048,
"grad_norm": 0.3800530976695048,
"learning_rate": 1.8039152404413513e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08500252664089203,
"step": 4975,
"valid_targets_mean": 6181.9,
"valid_targets_min": 4669
},
{
"epoch": 4.0520960520960525,
"grad_norm": 0.37536923845620823,
"learning_rate": 1.7998773398905536e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07884109765291214,
"step": 4980,
"valid_targets_mean": 6250.2,
"valid_targets_min": 4900
},
{
"epoch": 4.056166056166056,
"grad_norm": 0.369134672032628,
"learning_rate": 1.795840263154457e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0790032371878624,
"step": 4985,
"valid_targets_mean": 7156.4,
"valid_targets_min": 5323
},
{
"epoch": 4.06023606023606,
"grad_norm": 0.3823541536796184,
"learning_rate": 1.7918040268518863e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08844245970249176,
"step": 4990,
"valid_targets_mean": 7215.8,
"valid_targets_min": 4720
},
{
"epoch": 4.064306064306065,
"grad_norm": 0.3864166564460856,
"learning_rate": 1.7877686475982045e-05,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08641092479228973,
"step": 4995,
"valid_targets_mean": 6550.8,
"valid_targets_min": 5739
},
{
"epoch": 4.068376068376068,
"grad_norm": 0.3793296622743899,
"learning_rate": 1.783734142005248e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0891452431678772,
"step": 5000,
"valid_targets_mean": 6726.8,
"valid_targets_min": 4540
},
{
"epoch": 4.0724460724460725,
"grad_norm": 0.4723995482127612,
"learning_rate": 1.7797005266812556e-05,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0973764955997467,
"step": 5005,
"valid_targets_mean": 4573.4,
"valid_targets_min": 1039
},
{
"epoch": 4.076516076516077,
"grad_norm": 0.41477705618237604,
"learning_rate": 1.7756678182308018e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08957439661026001,
"step": 5010,
"valid_targets_mean": 6430.0,
"valid_targets_min": 5412
},
{
"epoch": 4.08058608058608,
"grad_norm": 0.6352736728460759,
"learning_rate": 1.7716360332547286e-05,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025655508041381836,
"step": 5015,
"valid_targets_mean": 583.1,
"valid_targets_min": 158
},
{
"epoch": 4.084656084656085,
"grad_norm": 0.3748310581528748,
"learning_rate": 1.7676051883500746e-05,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09119533747434616,
"step": 5020,
"valid_targets_mean": 8230.9,
"valid_targets_min": 5061
},
{
"epoch": 4.088726088726089,
"grad_norm": 0.4146647677224428,
"learning_rate": 1.76357530011001e-05,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09562458842992783,
"step": 5025,
"valid_targets_mean": 7238.9,
"valid_targets_min": 5112
},
{
"epoch": 4.0927960927960925,
"grad_norm": 0.3895491315857082,
"learning_rate": 1.7595463851237666e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07687856256961823,
"step": 5030,
"valid_targets_mean": 6322.8,
"valid_targets_min": 4867
},
{
"epoch": 4.096866096866097,
"grad_norm": 0.3535398598607784,
"learning_rate": 1.7555184599765697e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08618101477622986,
"step": 5035,
"valid_targets_mean": 7887.0,
"valid_targets_min": 6004
},
{
"epoch": 4.100936100936101,
"grad_norm": 0.3398185270105302,
"learning_rate": 1.7514915412495696e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07757728546857834,
"step": 5040,
"valid_targets_mean": 7090.2,
"valid_targets_min": 4917
},
{
"epoch": 4.105006105006105,
"grad_norm": 0.3735006074847723,
"learning_rate": 1.7474656455197746e-05,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08108969032764435,
"step": 5045,
"valid_targets_mean": 7441.9,
"valid_targets_min": 4202
},
{
"epoch": 4.109076109076109,
"grad_norm": 0.3963767640674053,
"learning_rate": 1.7434407893599803e-05,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08019435405731201,
"step": 5050,
"valid_targets_mean": 7901.8,
"valid_targets_min": 5060
},
{
"epoch": 4.113146113146113,
"grad_norm": 0.3279720037805319,
"learning_rate": 1.7394169893387044e-05,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07386630773544312,
"step": 5055,
"valid_targets_mean": 8557.6,
"valid_targets_min": 6331
},
{
"epoch": 4.117216117216117,
"grad_norm": 0.43210024185743623,
"learning_rate": 1.735394262020115e-05,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08315213024616241,
"step": 5060,
"valid_targets_mean": 4976.4,
"valid_targets_min": 2847
},
{
"epoch": 4.121286121286121,
"grad_norm": 0.47219602019627277,
"learning_rate": 1.7313726239639662e-05,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09470256417989731,
"step": 5065,
"valid_targets_mean": 7129.1,
"valid_targets_min": 5331
},
{
"epoch": 4.1253561253561255,
"grad_norm": 0.43079423430747293,
"learning_rate": 1.7273520917255277e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09296290576457977,
"step": 5070,
"valid_targets_mean": 6864.0,
"valid_targets_min": 4697
},
{
"epoch": 4.12942612942613,
"grad_norm": 0.43490675675482465,
"learning_rate": 1.7233326818555162e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0889597162604332,
"step": 5075,
"valid_targets_mean": 6631.9,
"valid_targets_min": 4623
},
{
"epoch": 4.133496133496133,
"grad_norm": 0.3756096966590715,
"learning_rate": 1.7193144109000286e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08131799101829529,
"step": 5080,
"valid_targets_mean": 6330.4,
"valid_targets_min": 5424
},
{
"epoch": 4.137566137566138,
"grad_norm": 0.3746393665646649,
"learning_rate": 1.7152972954004745e-05,
"loss": 0.1741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08426746726036072,
"step": 5085,
"valid_targets_mean": 6814.8,
"valid_targets_min": 4964
},
{
"epoch": 4.141636141636142,
"grad_norm": 0.4195480953550515,
"learning_rate": 1.711281351893505e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0972888171672821,
"step": 5090,
"valid_targets_mean": 6915.8,
"valid_targets_min": 5321
},
{
"epoch": 4.1457061457061455,
"grad_norm": 0.4316053213116156,
"learning_rate": 1.7072665969109485e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08947832882404327,
"step": 5095,
"valid_targets_mean": 6464.5,
"valid_targets_min": 5185
},
{
"epoch": 4.14977614977615,
"grad_norm": 0.39114306149720146,
"learning_rate": 1.703253046979739e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09024079144001007,
"step": 5100,
"valid_targets_mean": 7048.6,
"valid_targets_min": 4913
},
{
"epoch": 4.153846153846154,
"grad_norm": 0.4185179236015934,
"learning_rate": 1.6992407186218512e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09964226186275482,
"step": 5105,
"valid_targets_mean": 7469.2,
"valid_targets_min": 5426
},
{
"epoch": 4.157916157916158,
"grad_norm": 0.40064531771229606,
"learning_rate": 1.6952296283542303e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09262304753065109,
"step": 5110,
"valid_targets_mean": 6819.4,
"valid_targets_min": 5286
},
{
"epoch": 4.161986161986162,
"grad_norm": 0.38311400379103405,
"learning_rate": 1.691219792688726e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09319957345724106,
"step": 5115,
"valid_targets_mean": 7107.5,
"valid_targets_min": 5201
},
{
"epoch": 4.166056166056166,
"grad_norm": 0.3933047787302955,
"learning_rate": 1.6872112281320218e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08465088903903961,
"step": 5120,
"valid_targets_mean": 5642.6,
"valid_targets_min": 4838
},
{
"epoch": 4.17012617012617,
"grad_norm": 0.8525985607334213,
"learning_rate": 1.6832039511855702e-05,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13957032561302185,
"step": 5125,
"valid_targets_mean": 2054.1,
"valid_targets_min": 134
},
{
"epoch": 4.174196174196174,
"grad_norm": 0.4350065324995063,
"learning_rate": 1.6791979783455227e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08149752765893936,
"step": 5130,
"valid_targets_mean": 6686.4,
"valid_targets_min": 5256
},
{
"epoch": 4.1782661782661785,
"grad_norm": 0.4132065668153816,
"learning_rate": 1.6751933261026604e-05,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09279554337263107,
"step": 5135,
"valid_targets_mean": 6216.6,
"valid_targets_min": 5542
},
{
"epoch": 4.182336182336182,
"grad_norm": 0.4704024966834831,
"learning_rate": 1.671190010942331e-05,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08651970326900482,
"step": 5140,
"valid_targets_mean": 6486.1,
"valid_targets_min": 5531
},
{
"epoch": 4.186406186406186,
"grad_norm": 0.41768609875122026,
"learning_rate": 1.667188049344377e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08536796271800995,
"step": 5145,
"valid_targets_mean": 5797.4,
"valid_targets_min": 3911
},
{
"epoch": 4.190476190476191,
"grad_norm": 0.44999542060640974,
"learning_rate": 1.663187457783068e-05,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08768117427825928,
"step": 5150,
"valid_targets_mean": 6357.5,
"valid_targets_min": 5195
},
{
"epoch": 4.194546194546194,
"grad_norm": 0.4473459694163714,
"learning_rate": 1.659188252727035e-05,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08737886697053909,
"step": 5155,
"valid_targets_mean": 5808.9,
"valid_targets_min": 4959
},
{
"epoch": 4.1986161986161985,
"grad_norm": 0.5313940009593219,
"learning_rate": 1.6551904506392008e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05604414641857147,
"step": 5160,
"valid_targets_mean": 2591.5,
"valid_targets_min": 842
},
{
"epoch": 4.202686202686203,
"grad_norm": 0.4458022538668301,
"learning_rate": 1.651194067976713e-05,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08318484574556351,
"step": 5165,
"valid_targets_mean": 6006.9,
"valid_targets_min": 4769
},
{
"epoch": 4.206756206756207,
"grad_norm": 0.4421797804474541,
"learning_rate": 1.6471991211908768e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08438228070735931,
"step": 5170,
"valid_targets_mean": 6764.2,
"valid_targets_min": 5046
},
{
"epoch": 4.210826210826211,
"grad_norm": 0.44259170394302194,
"learning_rate": 1.6432056267270836e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09295166283845901,
"step": 5175,
"valid_targets_mean": 6055.8,
"valid_targets_min": 5182
},
{
"epoch": 4.214896214896215,
"grad_norm": 0.4174437145697535,
"learning_rate": 1.6392136010247496e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08445718884468079,
"step": 5180,
"valid_targets_mean": 7101.6,
"valid_targets_min": 5366
},
{
"epoch": 4.218966218966219,
"grad_norm": 0.39047654580039387,
"learning_rate": 1.6352230605172438e-05,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08764854073524475,
"step": 5185,
"valid_targets_mean": 7111.9,
"valid_targets_min": 5192
},
{
"epoch": 4.223036223036223,
"grad_norm": 0.44083057032394674,
"learning_rate": 1.63123402163182e-05,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08842865377664566,
"step": 5190,
"valid_targets_mean": 5509.9,
"valid_targets_min": 4790
},
{
"epoch": 4.227106227106227,
"grad_norm": 0.9039249010855949,
"learning_rate": 1.6272465007895528e-05,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09698623418807983,
"step": 5195,
"valid_targets_mean": 1581.9,
"valid_targets_min": 864
},
{
"epoch": 4.2311762311762315,
"grad_norm": 0.6984318659356797,
"learning_rate": 1.623260514405266e-05,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07721932977437973,
"step": 5200,
"valid_targets_mean": 1333.2,
"valid_targets_min": 632
},
{
"epoch": 4.235246235246235,
"grad_norm": 0.7988165421330412,
"learning_rate": 1.619276078887467e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0798022449016571,
"step": 5205,
"valid_targets_mean": 1602.9,
"valid_targets_min": 875
},
{
"epoch": 4.239316239316239,
"grad_norm": 0.8839676972961594,
"learning_rate": 1.6152932106382795e-05,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07965122908353806,
"step": 5210,
"valid_targets_mean": 1340.4,
"valid_targets_min": 701
},
{
"epoch": 4.243386243386244,
"grad_norm": 0.7568566322974944,
"learning_rate": 1.6113119260533743e-05,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08617518842220306,
"step": 5215,
"valid_targets_mean": 1792.9,
"valid_targets_min": 898
},
{
"epoch": 4.247456247456247,
"grad_norm": 0.7853461839643316,
"learning_rate": 1.6073322415219045e-05,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07748760282993317,
"step": 5220,
"valid_targets_mean": 1433.1,
"valid_targets_min": 1070
},
{
"epoch": 4.2515262515262515,
"grad_norm": 0.775021891537993,
"learning_rate": 1.6033541734264358e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07678981870412827,
"step": 5225,
"valid_targets_mean": 1589.5,
"valid_targets_min": 970
},
{
"epoch": 4.255596255596256,
"grad_norm": 0.7698989145856481,
"learning_rate": 1.5993777381428792e-05,
"loss": 0.1352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06523817032575607,
"step": 5230,
"valid_targets_mean": 1270.5,
"valid_targets_min": 648
},
{
"epoch": 4.259666259666259,
"grad_norm": 0.7897405384596183,
"learning_rate": 1.5954029520404252e-05,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08299176394939423,
"step": 5235,
"valid_targets_mean": 1674.5,
"valid_targets_min": 727
},
{
"epoch": 4.263736263736264,
"grad_norm": 0.7201703295282144,
"learning_rate": 1.5914298314814752e-05,
"loss": 0.1395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05681309849023819,
"step": 5240,
"valid_targets_mean": 1406.0,
"valid_targets_min": 770
},
{
"epoch": 4.267806267806268,
"grad_norm": 0.8007703569426596,
"learning_rate": 1.587458392821574e-05,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0649387463927269,
"step": 5245,
"valid_targets_mean": 1381.2,
"valid_targets_min": 572
},
{
"epoch": 4.2718762718762715,
"grad_norm": 0.770739474815444,
"learning_rate": 1.5834886524093415e-05,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08127094060182571,
"step": 5250,
"valid_targets_mean": 1580.4,
"valid_targets_min": 633
},
{
"epoch": 4.275946275946276,
"grad_norm": 0.8368026866328528,
"learning_rate": 1.5795206265864086e-05,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0783461183309555,
"step": 5255,
"valid_targets_mean": 1478.8,
"valid_targets_min": 923
},
{
"epoch": 4.28001628001628,
"grad_norm": 0.7152654874841173,
"learning_rate": 1.575554331687348e-05,
"loss": 0.1369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06594514846801758,
"step": 5260,
"valid_targets_mean": 1401.0,
"valid_targets_min": 740
},
{
"epoch": 4.284086284086284,
"grad_norm": 0.7469453449896892,
"learning_rate": 1.5715897840396056e-05,
"loss": 0.1379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06428131461143494,
"step": 5265,
"valid_targets_mean": 1588.9,
"valid_targets_min": 870
},
{
"epoch": 4.288156288156288,
"grad_norm": 0.7630766511387223,
"learning_rate": 1.5676269999634355e-05,
"loss": 0.1382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10081503540277481,
"step": 5270,
"valid_targets_mean": 2008.4,
"valid_targets_min": 1042
},
{
"epoch": 4.292226292226292,
"grad_norm": 0.7719765796935957,
"learning_rate": 1.5636659957718317e-05,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058920711278915405,
"step": 5275,
"valid_targets_mean": 1209.0,
"valid_targets_min": 870
},
{
"epoch": 4.296296296296296,
"grad_norm": 0.7392001894065844,
"learning_rate": 1.5597067877704627e-05,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07120724767446518,
"step": 5280,
"valid_targets_mean": 1535.5,
"valid_targets_min": 740
},
{
"epoch": 4.3003663003663,
"grad_norm": 0.6940002890801722,
"learning_rate": 1.5557493922576e-05,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07191811501979828,
"step": 5285,
"valid_targets_mean": 1642.9,
"valid_targets_min": 906
},
{
"epoch": 4.3044363044363045,
"grad_norm": 0.7996020542171901,
"learning_rate": 1.5517938255240558e-05,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07438832521438599,
"step": 5290,
"valid_targets_mean": 1570.5,
"valid_targets_min": 814
},
{
"epoch": 4.308506308506309,
"grad_norm": 0.7539368794630141,
"learning_rate": 1.5478401038531132e-05,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06699814647436142,
"step": 5295,
"valid_targets_mean": 1722.1,
"valid_targets_min": 832
},
{
"epoch": 4.312576312576312,
"grad_norm": 0.6917100664184215,
"learning_rate": 1.543888243520462e-05,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05670752376317978,
"step": 5300,
"valid_targets_mean": 1453.5,
"valid_targets_min": 891
},
{
"epoch": 4.316646316646317,
"grad_norm": 0.9493477730431549,
"learning_rate": 1.5399382607941267e-05,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08421558141708374,
"step": 5305,
"valid_targets_mean": 1584.4,
"valid_targets_min": 734
},
{
"epoch": 4.320716320716321,
"grad_norm": 0.7583084640701927,
"learning_rate": 1.535990171934405e-05,
"loss": 0.1323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06385685503482819,
"step": 5310,
"valid_targets_mean": 1495.2,
"valid_targets_min": 737
},
{
"epoch": 4.3247863247863245,
"grad_norm": 0.8067972324986055,
"learning_rate": 1.5320439931937968e-05,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07771594822406769,
"step": 5315,
"valid_targets_mean": 1737.0,
"valid_targets_min": 872
},
{
"epoch": 4.328856328856329,
"grad_norm": 0.791867781812196,
"learning_rate": 1.5280997408169412e-05,
"loss": 0.1346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07138702273368835,
"step": 5320,
"valid_targets_mean": 1431.6,
"valid_targets_min": 805
},
{
"epoch": 4.332926332926333,
"grad_norm": 0.7550711735218681,
"learning_rate": 1.5241574310405437e-05,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08015383780002594,
"step": 5325,
"valid_targets_mean": 2060.2,
"valid_targets_min": 1253
},
{
"epoch": 4.336996336996337,
"grad_norm": 0.8677822625949797,
"learning_rate": 1.5202170800933157e-05,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0818401500582695,
"step": 5330,
"valid_targets_mean": 2063.9,
"valid_targets_min": 1264
},
{
"epoch": 4.341066341066341,
"grad_norm": 0.7474043536365914,
"learning_rate": 1.516278704195904e-05,
"loss": 0.1371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05221828818321228,
"step": 5335,
"valid_targets_mean": 1036.5,
"valid_targets_min": 613
},
{
"epoch": 4.345136345136345,
"grad_norm": 0.7889949523343204,
"learning_rate": 1.512342319560826e-05,
"loss": 0.1371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06708300858736038,
"step": 5340,
"valid_targets_mean": 1674.4,
"valid_targets_min": 768
},
{
"epoch": 4.349206349206349,
"grad_norm": 0.7873060459244604,
"learning_rate": 1.5084079423924008e-05,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0583968311548233,
"step": 5345,
"valid_targets_mean": 1249.8,
"valid_targets_min": 714
},
{
"epoch": 4.353276353276353,
"grad_norm": 0.7925060855022024,
"learning_rate": 1.5044755888866838e-05,
"loss": 0.144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05081354081630707,
"step": 5350,
"valid_targets_mean": 1114.8,
"valid_targets_min": 800
},
{
"epoch": 4.357346357346358,
"grad_norm": 0.780052779669191,
"learning_rate": 1.5005452752314016e-05,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0766829401254654,
"step": 5355,
"valid_targets_mean": 1780.9,
"valid_targets_min": 933
},
{
"epoch": 4.361416361416361,
"grad_norm": 0.8731555755183956,
"learning_rate": 1.4966170176058804e-05,
"loss": 0.1355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06203790381550789,
"step": 5360,
"valid_targets_mean": 1113.6,
"valid_targets_min": 746
},
{
"epoch": 4.365486365486365,
"grad_norm": 0.8105488638885902,
"learning_rate": 1.4926908321809856e-05,
"loss": 0.1238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06966659426689148,
"step": 5365,
"valid_targets_mean": 1265.0,
"valid_targets_min": 814
},
{
"epoch": 4.36955636955637,
"grad_norm": 0.7570799683681111,
"learning_rate": 1.4887667351190508e-05,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07910779118537903,
"step": 5370,
"valid_targets_mean": 1652.1,
"valid_targets_min": 635
},
{
"epoch": 4.373626373626374,
"grad_norm": 0.8373628622647403,
"learning_rate": 1.4848447425738135e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05490382760763168,
"step": 5375,
"valid_targets_mean": 1231.2,
"valid_targets_min": 739
},
{
"epoch": 4.3776963776963775,
"grad_norm": 0.7459004049358479,
"learning_rate": 1.4809248706903476e-05,
"loss": 0.134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0814879834651947,
"step": 5380,
"valid_targets_mean": 1682.4,
"valid_targets_min": 831
},
{
"epoch": 4.381766381766382,
"grad_norm": 0.7901027972617194,
"learning_rate": 1.4770071356049966e-05,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06546150892972946,
"step": 5385,
"valid_targets_mean": 1571.6,
"valid_targets_min": 1015
},
{
"epoch": 4.385836385836386,
"grad_norm": 0.7459849965828421,
"learning_rate": 1.4730915534453084e-05,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059574246406555176,
"step": 5390,
"valid_targets_mean": 1276.8,
"valid_targets_min": 711
},
{
"epoch": 4.38990638990639,
"grad_norm": 0.7250412854507754,
"learning_rate": 1.4691781403299695e-05,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04473428428173065,
"step": 5395,
"valid_targets_mean": 1147.5,
"valid_targets_min": 733
},
{
"epoch": 4.393976393976394,
"grad_norm": 0.9341622348888069,
"learning_rate": 1.4652669123687335e-05,
"loss": 0.1388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08530112355947495,
"step": 5400,
"valid_targets_mean": 1604.0,
"valid_targets_min": 953
},
{
"epoch": 4.398046398046398,
"grad_norm": 0.7506012218410362,
"learning_rate": 1.4613578856623634e-05,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0721062421798706,
"step": 5405,
"valid_targets_mean": 1784.0,
"valid_targets_min": 1011
},
{
"epoch": 4.402116402116402,
"grad_norm": 0.9539670072016909,
"learning_rate": 1.4574510763025571e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09979036450386047,
"step": 5410,
"valid_targets_mean": 1729.0,
"valid_targets_min": 1143
},
{
"epoch": 4.406186406186406,
"grad_norm": 0.8152959339758997,
"learning_rate": 1.4535465003718872e-05,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06546957790851593,
"step": 5415,
"valid_targets_mean": 1483.9,
"valid_targets_min": 699
},
{
"epoch": 4.410256410256411,
"grad_norm": 1.0303278083543088,
"learning_rate": 1.4496441739437308e-05,
"loss": 0.1309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059898581355810165,
"step": 5420,
"valid_targets_mean": 1198.4,
"valid_targets_min": 680
},
{
"epoch": 4.414326414326414,
"grad_norm": 0.8198228481186385,
"learning_rate": 1.445744113082205e-05,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06732296943664551,
"step": 5425,
"valid_targets_mean": 1365.2,
"valid_targets_min": 687
},
{
"epoch": 4.418396418396418,
"grad_norm": 0.9913925030956331,
"learning_rate": 1.4418463338421014e-05,
"loss": 0.1331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05075017362833023,
"step": 5430,
"valid_targets_mean": 1142.9,
"valid_targets_min": 835
},
{
"epoch": 4.422466422466423,
"grad_norm": 0.8461959968216606,
"learning_rate": 1.4379508522688172e-05,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06075669825077057,
"step": 5435,
"valid_targets_mean": 1316.9,
"valid_targets_min": 829
},
{
"epoch": 4.426536426536426,
"grad_norm": 0.7557942053954224,
"learning_rate": 1.4340576843982941e-05,
"loss": 0.1279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07234987616539001,
"step": 5440,
"valid_targets_mean": 1739.2,
"valid_targets_min": 1138
},
{
"epoch": 4.430606430606431,
"grad_norm": 0.7526966602303533,
"learning_rate": 1.4301668462569463e-05,
"loss": 0.1382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06122884154319763,
"step": 5445,
"valid_targets_mean": 1592.2,
"valid_targets_min": 1174
},
{
"epoch": 4.434676434676435,
"grad_norm": 0.7785215289541277,
"learning_rate": 1.4262783538615997e-05,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06840664893388748,
"step": 5450,
"valid_targets_mean": 1543.1,
"valid_targets_min": 554
},
{
"epoch": 4.438746438746438,
"grad_norm": 0.8035141393477653,
"learning_rate": 1.4223922232194231e-05,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06752649694681168,
"step": 5455,
"valid_targets_mean": 1430.0,
"valid_targets_min": 843
},
{
"epoch": 4.442816442816443,
"grad_norm": 0.680868471747835,
"learning_rate": 1.4185084703278636e-05,
"loss": 0.1298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06250318884849548,
"step": 5460,
"valid_targets_mean": 1622.9,
"valid_targets_min": 849
},
{
"epoch": 4.446886446886447,
"grad_norm": 0.8578202447129205,
"learning_rate": 1.4146271111745785e-05,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06331510841846466,
"step": 5465,
"valid_targets_mean": 1429.0,
"valid_targets_min": 612
},
{
"epoch": 4.4509564509564505,
"grad_norm": 0.8243591653669494,
"learning_rate": 1.4107481617373738e-05,
"loss": 0.1366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05521140247583389,
"step": 5470,
"valid_targets_mean": 1283.0,
"valid_targets_min": 782
},
{
"epoch": 4.455026455026455,
"grad_norm": 0.8492636328085363,
"learning_rate": 1.406871637984132e-05,
"loss": 0.135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07561201602220535,
"step": 5475,
"valid_targets_mean": 1457.0,
"valid_targets_min": 926
},
{
"epoch": 4.459096459096459,
"grad_norm": 0.7560434633983276,
"learning_rate": 1.4029975558727546e-05,
"loss": 0.1292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05740554630756378,
"step": 5480,
"valid_targets_mean": 1399.6,
"valid_targets_min": 822
},
{
"epoch": 4.463166463166463,
"grad_norm": 0.7108917719684089,
"learning_rate": 1.399125931351088e-05,
"loss": 0.1241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060493603348731995,
"step": 5485,
"valid_targets_mean": 1464.6,
"valid_targets_min": 670
},
{
"epoch": 4.467236467236467,
"grad_norm": 0.8373770508282027,
"learning_rate": 1.3952567803568648e-05,
"loss": 0.1383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06813108921051025,
"step": 5490,
"valid_targets_mean": 1504.8,
"valid_targets_min": 647
},
{
"epoch": 4.471306471306471,
"grad_norm": 0.7967991746334874,
"learning_rate": 1.391390118817634e-05,
"loss": 0.135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051831118762493134,
"step": 5495,
"valid_targets_mean": 1276.9,
"valid_targets_min": 791
},
{
"epoch": 4.475376475376476,
"grad_norm": 0.8724038689238638,
"learning_rate": 1.3875259626506958e-05,
"loss": 0.1294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058950334787368774,
"step": 5500,
"valid_targets_mean": 1291.4,
"valid_targets_min": 746
},
{
"epoch": 4.479446479446479,
"grad_norm": 0.8243173279519246,
"learning_rate": 1.383664327763039e-05,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05535842478275299,
"step": 5505,
"valid_targets_mean": 1409.1,
"valid_targets_min": 892
},
{
"epoch": 4.483516483516484,
"grad_norm": 0.8045208272162921,
"learning_rate": 1.3798052300512707e-05,
"loss": 0.1382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07621202617883682,
"step": 5510,
"valid_targets_mean": 1581.9,
"valid_targets_min": 914
},
{
"epoch": 4.487586487586488,
"grad_norm": 0.8000566735592727,
"learning_rate": 1.3759486854015558e-05,
"loss": 0.1319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06206750124692917,
"step": 5515,
"valid_targets_mean": 1647.6,
"valid_targets_min": 636
},
{
"epoch": 4.491656491656491,
"grad_norm": 0.841307842616834,
"learning_rate": 1.3720947096895487e-05,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06576070189476013,
"step": 5520,
"valid_targets_mean": 1523.5,
"valid_targets_min": 641
},
{
"epoch": 4.495726495726496,
"grad_norm": 0.8127961832136743,
"learning_rate": 1.3682433187803283e-05,
"loss": 0.1333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07405531406402588,
"step": 5525,
"valid_targets_mean": 1629.4,
"valid_targets_min": 1020
},
{
"epoch": 4.4997964997965,
"grad_norm": 0.8576090738580665,
"learning_rate": 1.3643945285283336e-05,
"loss": 0.1305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05857028067111969,
"step": 5530,
"valid_targets_mean": 1163.4,
"valid_targets_min": 729
},
{
"epoch": 4.503866503866504,
"grad_norm": 0.8768940435922552,
"learning_rate": 1.3605483547772977e-05,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08095380663871765,
"step": 5535,
"valid_targets_mean": 1613.2,
"valid_targets_min": 1001
},
{
"epoch": 4.507936507936508,
"grad_norm": 0.8051072533291032,
"learning_rate": 1.3567048133601821e-05,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06716311722993851,
"step": 5540,
"valid_targets_mean": 1567.0,
"valid_targets_min": 1175
},
{
"epoch": 4.512006512006512,
"grad_norm": 0.8552572932480055,
"learning_rate": 1.352863920099114e-05,
"loss": 0.1346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08142690360546112,
"step": 5545,
"valid_targets_mean": 1609.0,
"valid_targets_min": 892
},
{
"epoch": 4.516076516076516,
"grad_norm": 0.9469817635167835,
"learning_rate": 1.3490256908053165e-05,
"loss": 0.1362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06301309913396835,
"step": 5550,
"valid_targets_mean": 1425.2,
"valid_targets_min": 801
},
{
"epoch": 4.52014652014652,
"grad_norm": 0.7579582875823737,
"learning_rate": 1.3451901412790485e-05,
"loss": 0.1237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06315524131059647,
"step": 5555,
"valid_targets_mean": 1462.4,
"valid_targets_min": 564
},
{
"epoch": 4.524216524216524,
"grad_norm": 0.7776282955223374,
"learning_rate": 1.341357287309537e-05,
"loss": 0.1266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06340664625167847,
"step": 5560,
"valid_targets_mean": 1749.1,
"valid_targets_min": 651
},
{
"epoch": 4.528286528286529,
"grad_norm": 0.8269577317944914,
"learning_rate": 1.3375271446749125e-05,
"loss": 0.1354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053509172052145004,
"step": 5565,
"valid_targets_mean": 1161.0,
"valid_targets_min": 716
},
{
"epoch": 4.532356532356532,
"grad_norm": 0.7967004348591504,
"learning_rate": 1.3336997291421441e-05,
"loss": 0.1275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06124432757496834,
"step": 5570,
"valid_targets_mean": 1425.6,
"valid_targets_min": 744
},
{
"epoch": 4.536426536426537,
"grad_norm": 0.7435104069530646,
"learning_rate": 1.3298750564669751e-05,
"loss": 0.1252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05810406804084778,
"step": 5575,
"valid_targets_mean": 1391.1,
"valid_targets_min": 1218
},
{
"epoch": 4.540496540496541,
"grad_norm": 0.7999784062535612,
"learning_rate": 1.3260531423938571e-05,
"loss": 0.1327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07500585913658142,
"step": 5580,
"valid_targets_mean": 1724.5,
"valid_targets_min": 793
},
{
"epoch": 4.544566544566544,
"grad_norm": 0.8510244277487944,
"learning_rate": 1.3222340026558855e-05,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06173360347747803,
"step": 5585,
"valid_targets_mean": 1366.8,
"valid_targets_min": 846
},
{
"epoch": 4.548636548636549,
"grad_norm": 0.8073160848727309,
"learning_rate": 1.3184176529747357e-05,
"loss": 0.1273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07489972561597824,
"step": 5590,
"valid_targets_mean": 1772.1,
"valid_targets_min": 979
},
{
"epoch": 4.552706552706553,
"grad_norm": 0.7253390941686678,
"learning_rate": 1.3146041090605977e-05,
"loss": 0.1351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07174719870090485,
"step": 5595,
"valid_targets_mean": 1778.9,
"valid_targets_min": 1093
},
{
"epoch": 4.556776556776557,
"grad_norm": 0.7424924022896014,
"learning_rate": 1.3107933866121117e-05,
"loss": 0.1167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0609469898045063,
"step": 5600,
"valid_targets_mean": 1510.8,
"valid_targets_min": 595
},
{
"epoch": 4.560846560846561,
"grad_norm": 0.8618358393453901,
"learning_rate": 1.306985501316302e-05,
"loss": 0.1284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06146273389458656,
"step": 5605,
"valid_targets_mean": 1330.4,
"valid_targets_min": 868
},
{
"epoch": 4.564916564916565,
"grad_norm": 0.8268278139473043,
"learning_rate": 1.3031804688485143e-05,
"loss": 0.1258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07098115980625153,
"step": 5610,
"valid_targets_mean": 1504.2,
"valid_targets_min": 914
},
{
"epoch": 4.568986568986569,
"grad_norm": 0.7720719541618248,
"learning_rate": 1.2993783048723515e-05,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07257020473480225,
"step": 5615,
"valid_targets_mean": 1972.9,
"valid_targets_min": 1080
},
{
"epoch": 4.573056573056573,
"grad_norm": 0.7939819756885284,
"learning_rate": 1.295579025039607e-05,
"loss": 0.1297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06880711764097214,
"step": 5620,
"valid_targets_mean": 1519.6,
"valid_targets_min": 658
},
{
"epoch": 4.5771265771265774,
"grad_norm": 0.7859404051654513,
"learning_rate": 1.2917826449902005e-05,
"loss": 0.1336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057696133852005005,
"step": 5625,
"valid_targets_mean": 1362.0,
"valid_targets_min": 1018
},
{
"epoch": 4.581196581196581,
"grad_norm": 0.828035069084943,
"learning_rate": 1.2879891803521167e-05,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07344723492860794,
"step": 5630,
"valid_targets_mean": 1623.0,
"valid_targets_min": 1041
},
{
"epoch": 4.585266585266585,
"grad_norm": 0.7735417380419619,
"learning_rate": 1.2841986467413384e-05,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05607450753450394,
"step": 5635,
"valid_targets_mean": 2889.2,
"valid_targets_min": 534
},
{
"epoch": 4.58933658933659,
"grad_norm": 0.460850977797522,
"learning_rate": 1.2804110597617817e-05,
"loss": 0.111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05251425504684448,
"step": 5640,
"valid_targets_mean": 3423.9,
"valid_targets_min": 2404
},
{
"epoch": 4.593406593406593,
"grad_norm": 0.3657662471298085,
"learning_rate": 1.2766264350052334e-05,
"loss": 0.0806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041075143963098526,
"step": 5645,
"valid_targets_mean": 3592.0,
"valid_targets_min": 3064
},
{
"epoch": 4.597476597476597,
"grad_norm": 0.3851006948518706,
"learning_rate": 1.2728447880512862e-05,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039379969239234924,
"step": 5650,
"valid_targets_mean": 3425.4,
"valid_targets_min": 2901
},
{
"epoch": 4.601546601546602,
"grad_norm": 0.3982103509768099,
"learning_rate": 1.2690661344672755e-05,
"loss": 0.0948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0414591059088707,
"step": 5655,
"valid_targets_mean": 3393.9,
"valid_targets_min": 2392
},
{
"epoch": 4.605616605616605,
"grad_norm": 0.46756243462854763,
"learning_rate": 1.2652904898082117e-05,
"loss": 0.078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034624554216861725,
"step": 5660,
"valid_targets_mean": 2066.5,
"valid_targets_min": 662
},
{
"epoch": 4.60968660968661,
"grad_norm": 0.8771981868563371,
"learning_rate": 1.2615178696167205e-05,
"loss": 0.1068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06684105098247528,
"step": 5665,
"valid_targets_mean": 1519.1,
"valid_targets_min": 724
},
{
"epoch": 4.613756613756614,
"grad_norm": 0.3782756354180073,
"learning_rate": 1.2577482894229777e-05,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04186592623591423,
"step": 5670,
"valid_targets_mean": 4022.1,
"valid_targets_min": 3668
},
{
"epoch": 4.617826617826617,
"grad_norm": 0.3867031798803203,
"learning_rate": 1.2539817647446446e-05,
"loss": 0.0872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04109447821974754,
"step": 5675,
"valid_targets_mean": 3483.0,
"valid_targets_min": 2891
},
{
"epoch": 4.621896621896622,
"grad_norm": 0.5812366237791688,
"learning_rate": 1.2502183110868031e-05,
"loss": 0.1197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09486156702041626,
"step": 5680,
"valid_targets_mean": 2689.9,
"valid_targets_min": 246
},
{
"epoch": 4.625966625966626,
"grad_norm": 0.28966277428771003,
"learning_rate": 1.2464579439418943e-05,
"loss": 0.0727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029673418030142784,
"step": 5685,
"valid_targets_mean": 5332.0,
"valid_targets_min": 886
},
{
"epoch": 4.63003663003663,
"grad_norm": 0.4205463767229215,
"learning_rate": 1.2427006787896537e-05,
"loss": 0.0825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03594677895307541,
"step": 5690,
"valid_targets_mean": 2137.1,
"valid_targets_min": 848
},
{
"epoch": 4.634106634106634,
"grad_norm": 0.31841598595521275,
"learning_rate": 1.2389465310970459e-05,
"loss": 0.0793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036279890686273575,
"step": 5695,
"valid_targets_mean": 3335.8,
"valid_targets_min": 758
},
{
"epoch": 4.638176638176638,
"grad_norm": 0.3807391992506858,
"learning_rate": 1.2351955163182039e-05,
"loss": 0.0948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04160192608833313,
"step": 5700,
"valid_targets_mean": 2811.1,
"valid_targets_min": 1146
},
{
"epoch": 4.642246642246643,
"grad_norm": 0.3742032229362971,
"learning_rate": 1.2314476498943622e-05,
"loss": 0.1083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04018232598900795,
"step": 5705,
"valid_targets_mean": 2773.0,
"valid_targets_min": 645
},
{
"epoch": 4.646316646316646,
"grad_norm": 0.3939537525171128,
"learning_rate": 1.2277029472537967e-05,
"loss": 0.0796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038491107523441315,
"step": 5710,
"valid_targets_mean": 2632.2,
"valid_targets_min": 579
},
{
"epoch": 4.6503866503866504,
"grad_norm": 0.4057474887227267,
"learning_rate": 1.2239614238117588e-05,
"loss": 0.0753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04323495551943779,
"step": 5715,
"valid_targets_mean": 2741.0,
"valid_targets_min": 1111
},
{
"epoch": 4.654456654456655,
"grad_norm": 0.5815162907436859,
"learning_rate": 1.2202230949704117e-05,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06871599704027176,
"step": 5720,
"valid_targets_mean": 2122.4,
"valid_targets_min": 812
},
{
"epoch": 4.658526658526658,
"grad_norm": 0.4521817666906546,
"learning_rate": 1.2164879761187691e-05,
"loss": 0.0871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03911435604095459,
"step": 5725,
"valid_targets_mean": 2335.0,
"valid_targets_min": 493
},
{
"epoch": 4.662596662596663,
"grad_norm": 0.47178406108628634,
"learning_rate": 1.212756082632631e-05,
"loss": 0.0865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03535778075456619,
"step": 5730,
"valid_targets_mean": 4099.9,
"valid_targets_min": 2949
},
{
"epoch": 4.666666666666667,
"grad_norm": 0.43766318103399476,
"learning_rate": 1.2090274298745172e-05,
"loss": 0.0942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04855756461620331,
"step": 5735,
"valid_targets_mean": 2667.8,
"valid_targets_min": 990
},
{
"epoch": 4.67073667073667,
"grad_norm": 0.5685037462804967,
"learning_rate": 1.2053020331936108e-05,
"loss": 0.1052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09078393876552582,
"step": 5740,
"valid_targets_mean": 1997.2,
"valid_targets_min": 974
},
{
"epoch": 4.674806674806675,
"grad_norm": 0.4814600386863112,
"learning_rate": 1.2015799079256876e-05,
"loss": 0.11,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053439922630786896,
"step": 5745,
"valid_targets_mean": 2656.1,
"valid_targets_min": 896
},
{
"epoch": 4.678876678876679,
"grad_norm": 0.4807779629525887,
"learning_rate": 1.1978610693930587e-05,
"loss": 0.0756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03917412832379341,
"step": 5750,
"valid_targets_mean": 1499.9,
"valid_targets_min": 550
},
{
"epoch": 4.682946682946683,
"grad_norm": 0.44551985651283915,
"learning_rate": 1.1941455329045047e-05,
"loss": 0.1135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04586545005440712,
"step": 5755,
"valid_targets_mean": 2963.0,
"valid_targets_min": 873
},
{
"epoch": 4.687016687016687,
"grad_norm": 0.4671700313248316,
"learning_rate": 1.1904333137552124e-05,
"loss": 0.0998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06650416553020477,
"step": 5760,
"valid_targets_mean": 3018.8,
"valid_targets_min": 1247
},
{
"epoch": 4.691086691086691,
"grad_norm": 0.54473726834285,
"learning_rate": 1.1867244272267136e-05,
"loss": 0.0842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05167562887072563,
"step": 5765,
"valid_targets_mean": 1737.4,
"valid_targets_min": 800
},
{
"epoch": 4.695156695156696,
"grad_norm": 0.6730426959023267,
"learning_rate": 1.1830188885868213e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13521423935890198,
"step": 5770,
"valid_targets_mean": 2176.9,
"valid_targets_min": 807
},
{
"epoch": 4.699226699226699,
"grad_norm": 0.4728336672436709,
"learning_rate": 1.1793167130895656e-05,
"loss": 0.1083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032692648470401764,
"step": 5775,
"valid_targets_mean": 1465.0,
"valid_targets_min": 507
},
{
"epoch": 4.7032967032967035,
"grad_norm": 0.3873581322887633,
"learning_rate": 1.1756179159751322e-05,
"loss": 0.0958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03570934757590294,
"step": 5780,
"valid_targets_mean": 3186.2,
"valid_targets_min": 658
},
{
"epoch": 4.707366707366708,
"grad_norm": 0.4264449290678136,
"learning_rate": 1.1719225124698003e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04953089728951454,
"step": 5785,
"valid_targets_mean": 3058.2,
"valid_targets_min": 826
},
{
"epoch": 4.711436711436711,
"grad_norm": 0.3737908843266182,
"learning_rate": 1.16823051778588e-05,
"loss": 0.0812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052201047539711,
"step": 5790,
"valid_targets_mean": 4502.5,
"valid_targets_min": 2131
},
{
"epoch": 4.715506715506716,
"grad_norm": 0.4570728348397021,
"learning_rate": 1.1645419471216462e-05,
"loss": 0.0854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.056565217673778534,
"step": 5795,
"valid_targets_mean": 3669.0,
"valid_targets_min": 1746
},
{
"epoch": 4.71957671957672,
"grad_norm": 0.3818909080202796,
"learning_rate": 1.1608568156612807e-05,
"loss": 0.0854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03912724554538727,
"step": 5800,
"valid_targets_mean": 2759.6,
"valid_targets_min": 595
},
{
"epoch": 4.7236467236467234,
"grad_norm": 0.36574902640964757,
"learning_rate": 1.1571751385748082e-05,
"loss": 0.0786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04248278588056564,
"step": 5805,
"valid_targets_mean": 3420.0,
"valid_targets_min": 825
},
{
"epoch": 4.727716727716728,
"grad_norm": 0.36160705101402424,
"learning_rate": 1.1534969310180303e-05,
"loss": 0.079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03156093508005142,
"step": 5810,
"valid_targets_mean": 3323.0,
"valid_targets_min": 687
},
{
"epoch": 4.731786731786732,
"grad_norm": 0.36054700912548693,
"learning_rate": 1.149822208132469e-05,
"loss": 0.075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041020315140485764,
"step": 5815,
"valid_targets_mean": 3504.0,
"valid_targets_min": 1956
},
{
"epoch": 4.735856735856736,
"grad_norm": 0.4108903603282782,
"learning_rate": 1.1461509850453e-05,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033342353999614716,
"step": 5820,
"valid_targets_mean": 3553.0,
"valid_targets_min": 1421
},
{
"epoch": 4.73992673992674,
"grad_norm": 0.43529092649816564,
"learning_rate": 1.1424832768692942e-05,
"loss": 0.0718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045596443116664886,
"step": 5825,
"valid_targets_mean": 3672.6,
"valid_targets_min": 1607
},
{
"epoch": 4.743996743996744,
"grad_norm": 0.31603285050379853,
"learning_rate": 1.1388190987027485e-05,
"loss": 0.1137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021315453574061394,
"step": 5830,
"valid_targets_mean": 2072.2,
"valid_targets_min": 535
},
{
"epoch": 4.748066748066748,
"grad_norm": 0.30398769091490463,
"learning_rate": 1.135158465629433e-05,
"loss": 0.0655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01872686669230461,
"step": 5835,
"valid_targets_mean": 2852.2,
"valid_targets_min": 583
},
{
"epoch": 4.752136752136752,
"grad_norm": 0.41779314691880687,
"learning_rate": 1.1315013927185224e-05,
"loss": 0.0714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03134084492921829,
"step": 5840,
"valid_targets_mean": 2778.2,
"valid_targets_min": 591
},
{
"epoch": 4.7562067562067565,
"grad_norm": 0.43596477198959716,
"learning_rate": 1.1278478950245364e-05,
"loss": 0.0685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040790289640426636,
"step": 5845,
"valid_targets_mean": 3474.1,
"valid_targets_min": 2154
},
{
"epoch": 4.76027676027676,
"grad_norm": 0.6262422674089861,
"learning_rate": 1.1241979875872748e-05,
"loss": 0.1148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0588751845061779,
"step": 5850,
"valid_targets_mean": 2075.6,
"valid_targets_min": 647
},
{
"epoch": 4.764346764346764,
"grad_norm": 0.4373065366822497,
"learning_rate": 1.120551685431761e-05,
"loss": 0.0854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07749606668949127,
"step": 5855,
"valid_targets_mean": 2382.5,
"valid_targets_min": 840
},
{
"epoch": 4.768416768416769,
"grad_norm": 0.44549286271516586,
"learning_rate": 1.1169090035681772e-05,
"loss": 0.1014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043722283095121384,
"step": 5860,
"valid_targets_mean": 2478.5,
"valid_targets_min": 684
},
{
"epoch": 4.772486772486772,
"grad_norm": 0.3836262029735173,
"learning_rate": 1.1132699569917982e-05,
"loss": 0.0804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033280737698078156,
"step": 5865,
"valid_targets_mean": 3505.0,
"valid_targets_min": 847
},
{
"epoch": 4.7765567765567765,
"grad_norm": 0.6061904603600585,
"learning_rate": 1.1096345606829388e-05,
"loss": 0.1076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04993060976266861,
"step": 5870,
"valid_targets_mean": 1690.6,
"valid_targets_min": 949
},
{
"epoch": 4.780626780626781,
"grad_norm": 0.45611765176673036,
"learning_rate": 1.1060028296068853e-05,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04060452803969383,
"step": 5875,
"valid_targets_mean": 3574.0,
"valid_targets_min": 2201
},
{
"epoch": 4.784696784696784,
"grad_norm": 0.714044002886353,
"learning_rate": 1.1023747787138361e-05,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04921393096446991,
"step": 5880,
"valid_targets_mean": 1174.5,
"valid_targets_min": 649
},
{
"epoch": 4.788766788766789,
"grad_norm": 0.44604008395762645,
"learning_rate": 1.0987504229388391e-05,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04379687458276749,
"step": 5885,
"valid_targets_mean": 3146.5,
"valid_targets_min": 707
},
{
"epoch": 4.792836792836793,
"grad_norm": 0.43017541020951683,
"learning_rate": 1.0951297772017319e-05,
"loss": 0.0847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045811258256435394,
"step": 5890,
"valid_targets_mean": 3508.5,
"valid_targets_min": 766
},
{
"epoch": 4.7969067969067964,
"grad_norm": 0.48390962547473454,
"learning_rate": 1.0915128564070803e-05,
"loss": 0.086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038865868002176285,
"step": 5895,
"valid_targets_mean": 2029.6,
"valid_targets_min": 516
},
{
"epoch": 4.800976800976801,
"grad_norm": 0.36825203623662306,
"learning_rate": 1.0878996754441151e-05,
"loss": 0.0702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04049721732735634,
"step": 5900,
"valid_targets_mean": 3818.9,
"valid_targets_min": 763
},
{
"epoch": 4.805046805046805,
"grad_norm": 0.43168309660573984,
"learning_rate": 1.0842902491866716e-05,
"loss": 0.0676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039305686950683594,
"step": 5905,
"valid_targets_mean": 4056.5,
"valid_targets_min": 2036
},
{
"epoch": 4.8091168091168095,
"grad_norm": 0.35933047571594207,
"learning_rate": 1.0806845924931296e-05,
"loss": 0.0793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03556220978498459,
"step": 5910,
"valid_targets_mean": 3477.1,
"valid_targets_min": 1122
},
{
"epoch": 4.813186813186813,
"grad_norm": 0.36322550413900717,
"learning_rate": 1.0770827202063505e-05,
"loss": 0.0969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02814421057701111,
"step": 5915,
"valid_targets_mean": 2432.0,
"valid_targets_min": 1139
},
{
"epoch": 4.817256817256817,
"grad_norm": 0.540577699819694,
"learning_rate": 1.073484647153619e-05,
"loss": 0.0918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04813909903168678,
"step": 5920,
"valid_targets_mean": 1705.1,
"valid_targets_min": 782
},
{
"epoch": 4.821326821326822,
"grad_norm": 0.2873896338117805,
"learning_rate": 1.0698903881465763e-05,
"loss": 0.0796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021741347387433052,
"step": 5925,
"valid_targets_mean": 4197.8,
"valid_targets_min": 4050
},
{
"epoch": 4.825396825396825,
"grad_norm": 0.34456005761736075,
"learning_rate": 1.0662999579811664e-05,
"loss": 0.0746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02447408251464367,
"step": 5930,
"valid_targets_mean": 3064.9,
"valid_targets_min": 945
},
{
"epoch": 4.8294668294668295,
"grad_norm": 0.49034557307772714,
"learning_rate": 1.06271337143757e-05,
"loss": 0.0931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05810309574007988,
"step": 5935,
"valid_targets_mean": 3935.9,
"valid_targets_min": 3235
},
{
"epoch": 4.833536833536834,
"grad_norm": 0.31610766883370367,
"learning_rate": 1.0591306432801467e-05,
"loss": 0.0697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032884612679481506,
"step": 5940,
"valid_targets_mean": 3656.0,
"valid_targets_min": 2848
},
{
"epoch": 4.837606837606837,
"grad_norm": 0.7350255340291643,
"learning_rate": 1.05555178825737e-05,
"loss": 0.0839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05409277603030205,
"step": 5945,
"valid_targets_mean": 1732.0,
"valid_targets_min": 742
},
{
"epoch": 4.841676841676842,
"grad_norm": 0.5190904613777559,
"learning_rate": 1.0519768211017726e-05,
"loss": 0.0792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.054192811250686646,
"step": 5950,
"valid_targets_mean": 2964.1,
"valid_targets_min": 1547
},
{
"epoch": 4.845746845746846,
"grad_norm": 0.48868311864434977,
"learning_rate": 1.0484057565298822e-05,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04929513484239578,
"step": 5955,
"valid_targets_mean": 1643.6,
"valid_targets_min": 811
},
{
"epoch": 4.8498168498168495,
"grad_norm": 0.5380227640246409,
"learning_rate": 1.0448386092421586e-05,
"loss": 0.0945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04821448400616646,
"step": 5960,
"valid_targets_mean": 1432.5,
"valid_targets_min": 854
},
{
"epoch": 4.853886853886854,
"grad_norm": 0.5675102154058619,
"learning_rate": 1.0412753939229385e-05,
"loss": 0.0752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04497600346803665,
"step": 5965,
"valid_targets_mean": 1551.0,
"valid_targets_min": 886
},
{
"epoch": 4.857956857956858,
"grad_norm": 0.37368458137912997,
"learning_rate": 1.037716125240372e-05,
"loss": 0.0841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0343891903758049,
"step": 5970,
"valid_targets_mean": 3490.9,
"valid_targets_min": 2839
},
{
"epoch": 4.8620268620268625,
"grad_norm": 0.465690197105879,
"learning_rate": 1.0341608178463623e-05,
"loss": 0.1007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0349278599023819,
"step": 5975,
"valid_targets_mean": 3522.9,
"valid_targets_min": 1322
},
{
"epoch": 4.866096866096866,
"grad_norm": 0.4539769609059549,
"learning_rate": 1.0306094863765066e-05,
"loss": 0.0791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04086630046367645,
"step": 5980,
"valid_targets_mean": 2675.1,
"valid_targets_min": 623
},
{
"epoch": 4.87016687016687,
"grad_norm": 0.5194040935548523,
"learning_rate": 1.027062145450033e-05,
"loss": 0.0703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03959763050079346,
"step": 5985,
"valid_targets_mean": 2448.1,
"valid_targets_min": 690
},
{
"epoch": 4.874236874236875,
"grad_norm": 0.5286302251911614,
"learning_rate": 1.023518809669744e-05,
"loss": 0.091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07098161429166794,
"step": 5990,
"valid_targets_mean": 3094.1,
"valid_targets_min": 1804
},
{
"epoch": 4.878306878306878,
"grad_norm": 0.4012211699517951,
"learning_rate": 1.0199794936219554e-05,
"loss": 0.087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04231107980012894,
"step": 5995,
"valid_targets_mean": 3015.2,
"valid_targets_min": 1605
},
{
"epoch": 4.8823768823768825,
"grad_norm": 0.48558169241283544,
"learning_rate": 1.0164442118764328e-05,
"loss": 0.065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04597931355237961,
"step": 6000,
"valid_targets_mean": 1446.4,
"valid_targets_min": 832
},
{
"epoch": 4.886446886446887,
"grad_norm": 0.46675560750287587,
"learning_rate": 1.0129129789863375e-05,
"loss": 0.0799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04974772036075592,
"step": 6005,
"valid_targets_mean": 3758.4,
"valid_targets_min": 1295
},
{
"epoch": 4.89051689051689,
"grad_norm": 0.3718508133031444,
"learning_rate": 1.0093858094881612e-05,
"loss": 0.075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029652055352926254,
"step": 6010,
"valid_targets_mean": 3927.1,
"valid_targets_min": 1057
},
{
"epoch": 4.894586894586895,
"grad_norm": 0.3548767930814201,
"learning_rate": 1.00586271790167e-05,
"loss": 0.0633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029149774461984634,
"step": 6015,
"valid_targets_mean": 3467.9,
"valid_targets_min": 853
},
{
"epoch": 4.898656898656899,
"grad_norm": 0.36526262775572454,
"learning_rate": 1.002343718729843e-05,
"loss": 0.0873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03588550537824631,
"step": 6020,
"valid_targets_mean": 4106.0,
"valid_targets_min": 3239
},
{
"epoch": 4.9027269027269025,
"grad_norm": 0.39347213994342317,
"learning_rate": 9.988288264588106e-06,
"loss": 0.0707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041096627712249756,
"step": 6025,
"valid_targets_mean": 3558.8,
"valid_targets_min": 769
},
{
"epoch": 4.906796906796907,
"grad_norm": 0.3567865777207391,
"learning_rate": 9.953180555578e-06,
"loss": 0.1034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03674373775720596,
"step": 6030,
"valid_targets_mean": 4000.0,
"valid_targets_min": 2959
},
{
"epoch": 4.910866910866911,
"grad_norm": 0.2939515031544418,
"learning_rate": 9.918114204790697e-06,
"loss": 0.0905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024303892627358437,
"step": 6035,
"valid_targets_mean": 3030.4,
"valid_targets_min": 629
},
{
"epoch": 4.914936914936915,
"grad_norm": 0.5314390212449058,
"learning_rate": 9.883089356578545e-06,
"loss": 0.0958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045132189989089966,
"step": 6040,
"valid_targets_mean": 3038.5,
"valid_targets_min": 1742
},
{
"epoch": 4.919006919006919,
"grad_norm": 0.33340762029888144,
"learning_rate": 9.848106155123045e-06,
"loss": 0.0701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02736440859735012,
"step": 6045,
"valid_targets_mean": 3813.6,
"valid_targets_min": 3003
},
{
"epoch": 4.923076923076923,
"grad_norm": 0.538168843602704,
"learning_rate": 9.813164744434256e-06,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0524737685918808,
"step": 6050,
"valid_targets_mean": 2625.8,
"valid_targets_min": 1025
},
{
"epoch": 4.927146927146927,
"grad_norm": 0.39397698811634346,
"learning_rate": 9.778265268350204e-06,
"loss": 0.0767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04419640451669693,
"step": 6055,
"valid_targets_mean": 3914.9,
"valid_targets_min": 3129
},
{
"epoch": 4.931216931216931,
"grad_norm": 0.788807885519458,
"learning_rate": 9.743407870536277e-06,
"loss": 0.1089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055179398506879807,
"step": 6060,
"valid_targets_mean": 1266.1,
"valid_targets_min": 458
},
{
"epoch": 4.9352869352869355,
"grad_norm": 0.4712531044323888,
"learning_rate": 9.708592694484655e-06,
"loss": 0.1036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03245309740304947,
"step": 6065,
"valid_targets_mean": 2087.1,
"valid_targets_min": 459
},
{
"epoch": 4.939356939356939,
"grad_norm": 0.5077235785209703,
"learning_rate": 9.673819883513727e-06,
"loss": 0.0858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06637755781412125,
"step": 6070,
"valid_targets_mean": 3098.8,
"valid_targets_min": 1694
},
{
"epoch": 4.943426943426943,
"grad_norm": 0.36026473643652757,
"learning_rate": 9.639089580767445e-06,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03487565368413925,
"step": 6075,
"valid_targets_mean": 4018.6,
"valid_targets_min": 3151
},
{
"epoch": 4.947496947496948,
"grad_norm": 0.42480201057736183,
"learning_rate": 9.604401929214805e-06,
"loss": 0.0778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033923834562301636,
"step": 6080,
"valid_targets_mean": 3190.0,
"valid_targets_min": 2197
},
{
"epoch": 4.951566951566951,
"grad_norm": 0.5467294848551612,
"learning_rate": 9.56975707164922e-06,
"loss": 0.0708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029525276273489,
"step": 6085,
"valid_targets_mean": 2252.9,
"valid_targets_min": 858
},
{
"epoch": 4.9556369556369555,
"grad_norm": 0.9869857674866476,
"learning_rate": 9.535155150687939e-06,
"loss": 0.087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07059233635663986,
"step": 6090,
"valid_targets_mean": 975.9,
"valid_targets_min": 563
},
{
"epoch": 4.95970695970696,
"grad_norm": 0.3873514877863149,
"learning_rate": 9.500596308771462e-06,
"loss": 0.0744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033523522317409515,
"step": 6095,
"valid_targets_mean": 3326.5,
"valid_targets_min": 701
},
{
"epoch": 4.963776963776963,
"grad_norm": 0.4142970786518696,
"learning_rate": 9.466080688162937e-06,
"loss": 0.0751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03642815351486206,
"step": 6100,
"valid_targets_mean": 3462.9,
"valid_targets_min": 2432
},
{
"epoch": 4.967846967846968,
"grad_norm": 0.4388097100302869,
"learning_rate": 9.431608430947619e-06,
"loss": 0.0724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03296447917819023,
"step": 6105,
"valid_targets_mean": 3280.9,
"valid_targets_min": 2018
},
{
"epoch": 4.971916971916972,
"grad_norm": 0.3737989484289901,
"learning_rate": 9.397179679032219e-06,
"loss": 0.0816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03461182862520218,
"step": 6110,
"valid_targets_mean": 3928.1,
"valid_targets_min": 485
},
{
"epoch": 4.975986975986976,
"grad_norm": 0.31608767099934815,
"learning_rate": 9.362794574144383e-06,
"loss": 0.0694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03851504623889923,
"step": 6115,
"valid_targets_mean": 4310.0,
"valid_targets_min": 800
},
{
"epoch": 4.98005698005698,
"grad_norm": 0.3283616246045454,
"learning_rate": 9.328453257832078e-06,
"loss": 0.0714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03032471239566803,
"step": 6120,
"valid_targets_mean": 4135.0,
"valid_targets_min": 740
},
{
"epoch": 4.984126984126984,
"grad_norm": 0.46368165314117155,
"learning_rate": 9.294155871463007e-06,
"loss": 0.0869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06997954845428467,
"step": 6125,
"valid_targets_mean": 3285.1,
"valid_targets_min": 1957
},
{
"epoch": 4.9881969881969885,
"grad_norm": 0.4185794895076128,
"learning_rate": 9.259902556224034e-06,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04614701494574547,
"step": 6130,
"valid_targets_mean": 3392.6,
"valid_targets_min": 1137
},
{
"epoch": 4.992266992266992,
"grad_norm": 0.5563291333666768,
"learning_rate": 9.225693453120614e-06,
"loss": 0.0786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06407204270362854,
"step": 6135,
"valid_targets_mean": 1517.8,
"valid_targets_min": 716
},
{
"epoch": 4.996336996336996,
"grad_norm": 0.38670562354030985,
"learning_rate": 9.191528702976173e-06,
"loss": 0.072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03636377677321434,
"step": 6140,
"valid_targets_mean": 3538.4,
"valid_targets_min": 886
},
{
"epoch": 5.0,
"grad_norm": 0.4464669787231326,
"learning_rate": 9.15740844643159e-06,
"loss": 0.0996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051706526428461075,
"step": 6145,
"valid_targets_mean": 4028.4,
"valid_targets_min": 1273
},
{
"epoch": 5.004070004070004,
"grad_norm": 0.6854109342653534,
"learning_rate": 9.123332823944552e-06,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09130831062793732,
"step": 6150,
"valid_targets_mean": 7389.0,
"valid_targets_min": 5627
},
{
"epoch": 5.008140008140008,
"grad_norm": 0.6566317430199434,
"learning_rate": 9.089301975789029e-06,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049035608768463135,
"step": 6155,
"valid_targets_mean": 1294.8,
"valid_targets_min": 422
},
{
"epoch": 5.012210012210012,
"grad_norm": 0.414825686168276,
"learning_rate": 9.05531604205467e-06,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09194067865610123,
"step": 6160,
"valid_targets_mean": 8539.9,
"valid_targets_min": 6761
},
{
"epoch": 5.0162800162800165,
"grad_norm": 0.40549825227625574,
"learning_rate": 9.021375162646233e-06,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08057986944913864,
"step": 6165,
"valid_targets_mean": 7579.0,
"valid_targets_min": 6174
},
{
"epoch": 5.02035002035002,
"grad_norm": 0.41714578888717524,
"learning_rate": 8.987479477282999e-06,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07731068134307861,
"step": 6170,
"valid_targets_mean": 7328.2,
"valid_targets_min": 4839
},
{
"epoch": 5.024420024420024,
"grad_norm": 0.40700870452137905,
"learning_rate": 8.953629125498227e-06,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09170807898044586,
"step": 6175,
"valid_targets_mean": 6838.2,
"valid_targets_min": 5034
},
{
"epoch": 5.028490028490029,
"grad_norm": 0.3922582234171617,
"learning_rate": 8.919824246638528e-06,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09518324583768845,
"step": 6180,
"valid_targets_mean": 7248.2,
"valid_targets_min": 5567
},
{
"epoch": 5.032560032560032,
"grad_norm": 0.3805986393619526,
"learning_rate": 8.886064979863334e-06,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07861495763063431,
"step": 6185,
"valid_targets_mean": 6234.0,
"valid_targets_min": 5603
},
{
"epoch": 5.0366300366300365,
"grad_norm": 0.6374511935157152,
"learning_rate": 8.852351464144322e-06,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024300407618284225,
"step": 6190,
"valid_targets_mean": 602.0,
"valid_targets_min": 152
},
{
"epoch": 5.040700040700041,
"grad_norm": 0.40242759534056755,
"learning_rate": 8.818683838264826e-06,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08006134629249573,
"step": 6195,
"valid_targets_mean": 7299.9,
"valid_targets_min": 6158
},
{
"epoch": 5.044770044770045,
"grad_norm": 0.3913058263835821,
"learning_rate": 8.785062240819266e-06,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08000493794679642,
"step": 6200,
"valid_targets_mean": 6140.0,
"valid_targets_min": 4648
},
{
"epoch": 5.048840048840049,
"grad_norm": 0.4080986618966172,
"learning_rate": 8.751486810212599e-06,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08597160875797272,
"step": 6205,
"valid_targets_mean": 6603.0,
"valid_targets_min": 4882
},
{
"epoch": 5.052910052910053,
"grad_norm": 0.3727143747867664,
"learning_rate": 8.717957684659717e-06,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08394499868154526,
"step": 6210,
"valid_targets_mean": 8015.0,
"valid_targets_min": 6344
},
{
"epoch": 5.056980056980057,
"grad_norm": 0.36991121771348234,
"learning_rate": 8.684475002184916e-06,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07384654879570007,
"step": 6215,
"valid_targets_mean": 6305.2,
"valid_targets_min": 4622
},
{
"epoch": 5.061050061050061,
"grad_norm": 0.3865770710996986,
"learning_rate": 8.651038900621277e-06,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0872340202331543,
"step": 6220,
"valid_targets_mean": 7890.8,
"valid_targets_min": 5485
},
{
"epoch": 5.065120065120065,
"grad_norm": 0.3847284521430894,
"learning_rate": 8.617649517610148e-06,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07563507556915283,
"step": 6225,
"valid_targets_mean": 7016.6,
"valid_targets_min": 4960
},
{
"epoch": 5.0691900691900695,
"grad_norm": 0.4213687533775985,
"learning_rate": 8.584306990600554e-06,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07866060733795166,
"step": 6230,
"valid_targets_mean": 6527.1,
"valid_targets_min": 5399
},
{
"epoch": 5.073260073260073,
"grad_norm": 0.46746065430470146,
"learning_rate": 8.55101145684864e-06,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07950198650360107,
"step": 6235,
"valid_targets_mean": 4995.0,
"valid_targets_min": 618
},
{
"epoch": 5.077330077330077,
"grad_norm": 0.42212928764720686,
"learning_rate": 8.517763053417095e-06,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09315831959247589,
"step": 6240,
"valid_targets_mean": 7219.4,
"valid_targets_min": 5764
},
{
"epoch": 5.081400081400082,
"grad_norm": 0.4077166480983304,
"learning_rate": 8.484561917174592e-06,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08582858741283417,
"step": 6245,
"valid_targets_mean": 7998.5,
"valid_targets_min": 5902
},
{
"epoch": 5.085470085470085,
"grad_norm": 0.3787575234434601,
"learning_rate": 8.451408184795242e-06,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06539824604988098,
"step": 6250,
"valid_targets_mean": 7377.4,
"valid_targets_min": 5015
},
{
"epoch": 5.0895400895400895,
"grad_norm": 0.3870195711380443,
"learning_rate": 8.418301992757984e-06,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07054895162582397,
"step": 6255,
"valid_targets_mean": 6794.0,
"valid_targets_min": 5283
},
{
"epoch": 5.093610093610094,
"grad_norm": 0.41166952386174893,
"learning_rate": 8.385243477346095e-06,
"loss": 0.1682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09239070862531662,
"step": 6260,
"valid_targets_mean": 6656.4,
"valid_targets_min": 4364
},
{
"epoch": 5.097680097680097,
"grad_norm": 0.38241917148742083,
"learning_rate": 8.352232774646545e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07691332697868347,
"step": 6265,
"valid_targets_mean": 7178.4,
"valid_targets_min": 4448
},
{
"epoch": 5.101750101750102,
"grad_norm": 0.4136989734963614,
"learning_rate": 8.319270020549517e-06,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0996970385313034,
"step": 6270,
"valid_targets_mean": 7619.8,
"valid_targets_min": 5737
},
{
"epoch": 5.105820105820106,
"grad_norm": 0.37122078417443183,
"learning_rate": 8.286355350747795e-06,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07079966366291046,
"step": 6275,
"valid_targets_mean": 8754.4,
"valid_targets_min": 5752
},
{
"epoch": 5.1098901098901095,
"grad_norm": 0.41739380473502985,
"learning_rate": 8.253488900736226e-06,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.077818363904953,
"step": 6280,
"valid_targets_mean": 6341.0,
"valid_targets_min": 4543
},
{
"epoch": 5.113960113960114,
"grad_norm": 0.41626778838918543,
"learning_rate": 8.220670805811156e-06,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0813712328672409,
"step": 6285,
"valid_targets_mean": 7181.9,
"valid_targets_min": 4563
},
{
"epoch": 5.118030118030118,
"grad_norm": 0.7414749413994536,
"learning_rate": 8.187901201069878e-06,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051455169916152954,
"step": 6290,
"valid_targets_mean": 1104.4,
"valid_targets_min": 161
},
{
"epoch": 5.122100122100122,
"grad_norm": 0.42212437842472816,
"learning_rate": 8.155180221410062e-06,
"loss": 0.1523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07822007685899734,
"step": 6295,
"valid_targets_mean": 7018.2,
"valid_targets_min": 5424
},
{
"epoch": 5.126170126170126,
"grad_norm": 0.43199230917096043,
"learning_rate": 8.12250800152923e-06,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08775204420089722,
"step": 6300,
"valid_targets_mean": 7738.4,
"valid_targets_min": 5329
},
{
"epoch": 5.13024013024013,
"grad_norm": 0.4607805236152848,
"learning_rate": 8.089884675924155e-06,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08426693081855774,
"step": 6305,
"valid_targets_mean": 6426.6,
"valid_targets_min": 5560
},
{
"epoch": 5.134310134310135,
"grad_norm": 0.42455220317990994,
"learning_rate": 8.057310378890362e-06,
"loss": 0.171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0837627574801445,
"step": 6310,
"valid_targets_mean": 6169.9,
"valid_targets_min": 3446
},
{
"epoch": 5.138380138380138,
"grad_norm": 0.39791893535614575,
"learning_rate": 8.024785244521528e-06,
"loss": 0.1676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08946311473846436,
"step": 6315,
"valid_targets_mean": 7204.6,
"valid_targets_min": 5381
},
{
"epoch": 5.1424501424501425,
"grad_norm": 0.3868007797054446,
"learning_rate": 7.99230940670896e-06,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08641095459461212,
"step": 6320,
"valid_targets_mean": 7600.4,
"valid_targets_min": 5241
},
{
"epoch": 5.146520146520147,
"grad_norm": 0.39428677674139484,
"learning_rate": 7.959882999141032e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09060313552618027,
"step": 6325,
"valid_targets_mean": 7098.5,
"valid_targets_min": 5607
},
{
"epoch": 5.15059015059015,
"grad_norm": 0.4263247652696508,
"learning_rate": 7.92750615530264e-06,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09046140313148499,
"step": 6330,
"valid_targets_mean": 6955.1,
"valid_targets_min": 5530
},
{
"epoch": 5.154660154660155,
"grad_norm": 0.4159005125904762,
"learning_rate": 7.895179008474634e-06,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08619844913482666,
"step": 6335,
"valid_targets_mean": 6748.1,
"valid_targets_min": 5364
},
{
"epoch": 5.158730158730159,
"grad_norm": 0.45512866927412166,
"learning_rate": 7.862901691733287e-06,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0810968279838562,
"step": 6340,
"valid_targets_mean": 6273.9,
"valid_targets_min": 5438
},
{
"epoch": 5.1628001628001625,
"grad_norm": 0.4004779475142846,
"learning_rate": 7.830674337949756e-06,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07858355343341827,
"step": 6345,
"valid_targets_mean": 6419.5,
"valid_targets_min": 4879
},
{
"epoch": 5.166870166870167,
"grad_norm": 0.4558820682158631,
"learning_rate": 7.798497079789513e-06,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07956701517105103,
"step": 6350,
"valid_targets_mean": 6483.4,
"valid_targets_min": 4309
},
{
"epoch": 5.170940170940171,
"grad_norm": 0.4440243865004471,
"learning_rate": 7.76637004971182e-06,
"loss": 0.1335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09749727696180344,
"step": 6355,
"valid_targets_mean": 6825.0,
"valid_targets_min": 5205
},
{
"epoch": 5.175010175010175,
"grad_norm": 0.4204178711309292,
"learning_rate": 7.734293379969157e-06,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07635550945997238,
"step": 6360,
"valid_targets_mean": 6729.4,
"valid_targets_min": 5200
},
{
"epoch": 5.179080179080179,
"grad_norm": 0.42587388736681253,
"learning_rate": 7.702267202606709e-06,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07823633402585983,
"step": 6365,
"valid_targets_mean": 6094.0,
"valid_targets_min": 5302
},
{
"epoch": 5.183150183150183,
"grad_norm": 0.40638485768353844,
"learning_rate": 7.670291649461798e-06,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08494766801595688,
"step": 6370,
"valid_targets_mean": 7140.0,
"valid_targets_min": 5270
},
{
"epoch": 5.187220187220187,
"grad_norm": 0.3845786657820816,
"learning_rate": 7.638366852163348e-06,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07755722105503082,
"step": 6375,
"valid_targets_mean": 7425.0,
"valid_targets_min": 5281
},
{
"epoch": 5.191290191290191,
"grad_norm": 0.41277396807257505,
"learning_rate": 7.606492942131336e-06,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1049172580242157,
"step": 6380,
"valid_targets_mean": 7063.4,
"valid_targets_min": 5386
},
{
"epoch": 5.1953601953601956,
"grad_norm": 0.40861047918605575,
"learning_rate": 7.574670050576281e-06,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08464010059833527,
"step": 6385,
"valid_targets_mean": 6827.0,
"valid_targets_min": 4547
},
{
"epoch": 5.199430199430199,
"grad_norm": 0.5620066997157668,
"learning_rate": 7.542898308498663e-06,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038255929946899414,
"step": 6390,
"valid_targets_mean": 2047.0,
"valid_targets_min": 165
},
{
"epoch": 5.203500203500203,
"grad_norm": 0.44632121984559203,
"learning_rate": 7.511177846688413e-06,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07810096442699432,
"step": 6395,
"valid_targets_mean": 6754.1,
"valid_targets_min": 5196
},
{
"epoch": 5.207570207570208,
"grad_norm": 0.4574803118753031,
"learning_rate": 7.479508795724361e-06,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07977963984012604,
"step": 6400,
"valid_targets_mean": 5985.6,
"valid_targets_min": 5028
},
{
"epoch": 5.211640211640212,
"grad_norm": 0.42827249479040463,
"learning_rate": 7.447891285973705e-06,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07478997111320496,
"step": 6405,
"valid_targets_mean": 5963.9,
"valid_targets_min": 5237
},
{
"epoch": 5.2157102157102155,
"grad_norm": 0.4401945100045424,
"learning_rate": 7.416325447591468e-06,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08579155802726746,
"step": 6410,
"valid_targets_mean": 6319.0,
"valid_targets_min": 5412
},
{
"epoch": 5.21978021978022,
"grad_norm": 0.3872584192038548,
"learning_rate": 7.384811410519961e-06,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06653904169797897,
"step": 6415,
"valid_targets_mean": 7125.8,
"valid_targets_min": 5080
},
{
"epoch": 5.223850223850224,
"grad_norm": 0.4118913981470542,
"learning_rate": 7.353349304488251e-06,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07929787784814835,
"step": 6420,
"valid_targets_mean": 6123.5,
"valid_targets_min": 4521
},
{
"epoch": 5.227920227920228,
"grad_norm": 0.8933632330027761,
"learning_rate": 7.321939259011639e-06,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09677982330322266,
"step": 6425,
"valid_targets_mean": 1886.0,
"valid_targets_min": 1111
},
{
"epoch": 5.231990231990232,
"grad_norm": 0.7717354209997601,
"learning_rate": 7.29058140339111e-06,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07828053832054138,
"step": 6430,
"valid_targets_mean": 1497.6,
"valid_targets_min": 893
},
{
"epoch": 5.236060236060236,
"grad_norm": 0.7156196156160548,
"learning_rate": 7.259275866712812e-06,
"loss": 0.1394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05080351233482361,
"step": 6435,
"valid_targets_mean": 1356.0,
"valid_targets_min": 914
},
{
"epoch": 5.24013024013024,
"grad_norm": 0.7775879541195082,
"learning_rate": 7.22802277784751e-06,
"loss": 0.1354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05790482088923454,
"step": 6440,
"valid_targets_mean": 1324.5,
"valid_targets_min": 680
},
{
"epoch": 5.244200244200244,
"grad_norm": 0.7428014404555288,
"learning_rate": 7.196822265450079e-06,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06787339597940445,
"step": 6445,
"valid_targets_mean": 1931.8,
"valid_targets_min": 876
},
{
"epoch": 5.248270248270249,
"grad_norm": 0.8246845467297721,
"learning_rate": 7.165674457958938e-06,
"loss": 0.1319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05890588089823723,
"step": 6450,
"valid_targets_mean": 1292.2,
"valid_targets_min": 734
},
{
"epoch": 5.252340252340252,
"grad_norm": 0.7747801015256733,
"learning_rate": 7.134579483595574e-06,
"loss": 0.1396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05581791326403618,
"step": 6455,
"valid_targets_mean": 1469.6,
"valid_targets_min": 655
},
{
"epoch": 5.256410256410256,
"grad_norm": 0.7889248714375038,
"learning_rate": 7.10353747036395e-06,
"loss": 0.1197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07032492756843567,
"step": 6460,
"valid_targets_mean": 1548.4,
"valid_targets_min": 737
},
{
"epoch": 5.260480260480261,
"grad_norm": 0.7576401372568481,
"learning_rate": 7.072548546050038e-06,
"loss": 0.1395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.056093454360961914,
"step": 6465,
"valid_targets_mean": 1316.5,
"valid_targets_min": 759
},
{
"epoch": 5.264550264550264,
"grad_norm": 0.8148494000497493,
"learning_rate": 7.041612838221257e-06,
"loss": 0.1288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0493401475250721,
"step": 6470,
"valid_targets_mean": 1249.6,
"valid_targets_min": 753
},
{
"epoch": 5.2686202686202686,
"grad_norm": 0.8821896425064455,
"learning_rate": 7.010730474225958e-06,
"loss": 0.131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0843823179602623,
"step": 6475,
"valid_targets_mean": 1833.0,
"valid_targets_min": 927
},
{
"epoch": 5.272690272690273,
"grad_norm": 0.8128938462953682,
"learning_rate": 6.979901581192903e-06,
"loss": 0.1297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06127440556883812,
"step": 6480,
"valid_targets_mean": 1338.4,
"valid_targets_min": 679
},
{
"epoch": 5.276760276760276,
"grad_norm": 0.8516276560604461,
"learning_rate": 6.949126286030739e-06,
"loss": 0.1313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06296617537736893,
"step": 6485,
"valid_targets_mean": 1244.6,
"valid_targets_min": 771
},
{
"epoch": 5.280830280830281,
"grad_norm": 0.7641818533358684,
"learning_rate": 6.91840471542746e-06,
"loss": 0.1159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05841711908578873,
"step": 6490,
"valid_targets_mean": 1732.5,
"valid_targets_min": 986
},
{
"epoch": 5.284900284900285,
"grad_norm": 0.7751581720642792,
"learning_rate": 6.887736995849925e-06,
"loss": 0.1226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.054849620908498764,
"step": 6495,
"valid_targets_mean": 1389.9,
"valid_targets_min": 1103
},
{
"epoch": 5.2889702889702885,
"grad_norm": 0.8647625768666302,
"learning_rate": 6.857123253543286e-06,
"loss": 0.1249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06798947602510452,
"step": 6500,
"valid_targets_mean": 1593.2,
"valid_targets_min": 675
},
{
"epoch": 5.293040293040293,
"grad_norm": 0.8101312346504578,
"learning_rate": 6.826563614530511e-06,
"loss": 0.131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07953788340091705,
"step": 6505,
"valid_targets_mean": 1926.6,
"valid_targets_min": 974
},
{
"epoch": 5.297110297110297,
"grad_norm": 0.8479150840387949,
"learning_rate": 6.7960582046118505e-06,
"loss": 0.1282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07549211382865906,
"step": 6510,
"valid_targets_mean": 1953.1,
"valid_targets_min": 869
},
{
"epoch": 5.301180301180302,
"grad_norm": 0.7598838779769721,
"learning_rate": 6.765607149364313e-06,
"loss": 0.1302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053766507655382156,
"step": 6515,
"valid_targets_mean": 1327.2,
"valid_targets_min": 1023
},
{
"epoch": 5.305250305250305,
"grad_norm": 1.6475991371156928,
"learning_rate": 6.735210574141158e-06,
"loss": 0.1296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06451068818569183,
"step": 6520,
"valid_targets_mean": 1717.9,
"valid_targets_min": 709
},
{
"epoch": 5.309320309320309,
"grad_norm": 0.8012862936876622,
"learning_rate": 6.704868604071362e-06,
"loss": 0.1261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05108807235956192,
"step": 6525,
"valid_targets_mean": 1139.9,
"valid_targets_min": 658
},
{
"epoch": 5.313390313390314,
"grad_norm": 1.10291965479662,
"learning_rate": 6.674581364059138e-06,
"loss": 0.1276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06254150718450546,
"step": 6530,
"valid_targets_mean": 1444.8,
"valid_targets_min": 662
},
{
"epoch": 5.317460317460317,
"grad_norm": 0.7975798780270608,
"learning_rate": 6.644348978783375e-06,
"loss": 0.1248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045557815581560135,
"step": 6535,
"valid_targets_mean": 1242.2,
"valid_targets_min": 859
},
{
"epoch": 5.321530321530322,
"grad_norm": 0.808432619410068,
"learning_rate": 6.614171572697172e-06,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06855520606040955,
"step": 6540,
"valid_targets_mean": 1569.2,
"valid_targets_min": 950
},
{
"epoch": 5.325600325600326,
"grad_norm": 0.8165752644870131,
"learning_rate": 6.584049270027291e-06,
"loss": 0.1206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058723099529743195,
"step": 6545,
"valid_targets_mean": 1539.8,
"valid_targets_min": 686
},
{
"epoch": 5.329670329670329,
"grad_norm": 0.8800699749983475,
"learning_rate": 6.553982194773663e-06,
"loss": 0.1238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07176946103572845,
"step": 6550,
"valid_targets_mean": 1610.6,
"valid_targets_min": 702
},
{
"epoch": 5.333740333740334,
"grad_norm": 0.7914141839534132,
"learning_rate": 6.523970470708874e-06,
"loss": 0.1199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04290122538805008,
"step": 6555,
"valid_targets_mean": 1190.4,
"valid_targets_min": 779
},
{
"epoch": 5.337810337810338,
"grad_norm": 0.8735942419573629,
"learning_rate": 6.494014221377654e-06,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06523449718952179,
"step": 6560,
"valid_targets_mean": 1467.1,
"valid_targets_min": 822
},
{
"epoch": 5.3418803418803416,
"grad_norm": 0.7904142925153533,
"learning_rate": 6.4641135700963555e-06,
"loss": 0.1188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0542932003736496,
"step": 6565,
"valid_targets_mean": 1350.5,
"valid_targets_min": 868
},
{
"epoch": 5.345950345950346,
"grad_norm": 0.8188017954142414,
"learning_rate": 6.434268639952482e-06,
"loss": 0.1246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052746959030628204,
"step": 6570,
"valid_targets_mean": 1283.5,
"valid_targets_min": 781
},
{
"epoch": 5.35002035002035,
"grad_norm": 0.8883502243806306,
"learning_rate": 6.4044795538041325e-06,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052638888359069824,
"step": 6575,
"valid_targets_mean": 1303.2,
"valid_targets_min": 793
},
{
"epoch": 5.354090354090354,
"grad_norm": 0.7346427480548663,
"learning_rate": 6.374746434279542e-06,
"loss": 0.1218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0480545237660408,
"step": 6580,
"valid_targets_mean": 1309.1,
"valid_targets_min": 806
},
{
"epoch": 5.358160358160358,
"grad_norm": 0.7749262088030695,
"learning_rate": 6.345069403776547e-06,
"loss": 0.1199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05063071846961975,
"step": 6585,
"valid_targets_mean": 1397.6,
"valid_targets_min": 803
},
{
"epoch": 5.362230362230362,
"grad_norm": 0.8904924291717923,
"learning_rate": 6.3154485844620935e-06,
"loss": 0.1202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045979805290699005,
"step": 6590,
"valid_targets_mean": 1187.8,
"valid_targets_min": 660
},
{
"epoch": 5.366300366300366,
"grad_norm": 0.8134025550512829,
"learning_rate": 6.285884098271739e-06,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05374240130186081,
"step": 6595,
"valid_targets_mean": 1547.0,
"valid_targets_min": 853
},
{
"epoch": 5.37037037037037,
"grad_norm": 0.8806055042632812,
"learning_rate": 6.25637606690912e-06,
"loss": 0.122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06583143770694733,
"step": 6600,
"valid_targets_mean": 1704.2,
"valid_targets_min": 719
},
{
"epoch": 5.374440374440375,
"grad_norm": 0.9022742278146144,
"learning_rate": 6.226924611845495e-06,
"loss": 0.1209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04527607560157776,
"step": 6605,
"valid_targets_mean": 1255.0,
"valid_targets_min": 765
},
{
"epoch": 5.378510378510379,
"grad_norm": 0.8451608246424978,
"learning_rate": 6.197529854319222e-06,
"loss": 0.1181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06376711279153824,
"step": 6610,
"valid_targets_mean": 1550.8,
"valid_targets_min": 875
},
{
"epoch": 5.382580382580382,
"grad_norm": 0.8477923753137665,
"learning_rate": 6.168191915335242e-06,
"loss": 0.1162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06021396815776825,
"step": 6615,
"valid_targets_mean": 1362.0,
"valid_targets_min": 739
},
{
"epoch": 5.386650386650387,
"grad_norm": 0.8811854153496774,
"learning_rate": 6.138910915664624e-06,
"loss": 0.1238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.069005087018013,
"step": 6620,
"valid_targets_mean": 1666.8,
"valid_targets_min": 760
},
{
"epoch": 5.390720390720391,
"grad_norm": 0.8205504832118758,
"learning_rate": 6.109686975844029e-06,
"loss": 0.1173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05043880641460419,
"step": 6625,
"valid_targets_mean": 1319.6,
"valid_targets_min": 1046
},
{
"epoch": 5.394790394790395,
"grad_norm": 1.1123497884965143,
"learning_rate": 6.080520216175236e-06,
"loss": 0.1249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06800902634859085,
"step": 6630,
"valid_targets_mean": 1727.9,
"valid_targets_min": 851
},
{
"epoch": 5.398860398860399,
"grad_norm": 0.8955095197538415,
"learning_rate": 6.051410756724638e-06,
"loss": 0.1276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06400962918996811,
"step": 6635,
"valid_targets_mean": 1643.2,
"valid_targets_min": 907
},
{
"epoch": 5.402930402930403,
"grad_norm": 0.867837643579163,
"learning_rate": 6.022358717322734e-06,
"loss": 0.135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05850240960717201,
"step": 6640,
"valid_targets_mean": 1478.5,
"valid_targets_min": 764
},
{
"epoch": 5.407000407000407,
"grad_norm": 0.7621902905404546,
"learning_rate": 5.993364217563671e-06,
"loss": 0.1176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05375190079212189,
"step": 6645,
"valid_targets_mean": 1522.6,
"valid_targets_min": 822
},
{
"epoch": 5.411070411070411,
"grad_norm": 0.8033822439060038,
"learning_rate": 5.964427376804726e-06,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06127481535077095,
"step": 6650,
"valid_targets_mean": 1589.0,
"valid_targets_min": 982
},
{
"epoch": 5.415140415140415,
"grad_norm": 0.7789522955304922,
"learning_rate": 5.935548314165809e-06,
"loss": 0.1247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05730774253606796,
"step": 6655,
"valid_targets_mean": 1574.8,
"valid_targets_min": 816
},
{
"epoch": 5.419210419210419,
"grad_norm": 0.7825880008149688,
"learning_rate": 5.9067271485289945e-06,
"loss": 0.1141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05469139292836189,
"step": 6660,
"valid_targets_mean": 1422.0,
"valid_targets_min": 721
},
{
"epoch": 5.423280423280423,
"grad_norm": 0.8034253037962921,
"learning_rate": 5.877963998538019e-06,
"loss": 0.1138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04614481329917908,
"step": 6665,
"valid_targets_mean": 1150.6,
"valid_targets_min": 741
},
{
"epoch": 5.427350427350428,
"grad_norm": 0.8550910565715886,
"learning_rate": 5.849258982597801e-06,
"loss": 0.1183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06886758655309677,
"step": 6670,
"valid_targets_mean": 1684.2,
"valid_targets_min": 734
},
{
"epoch": 5.431420431420431,
"grad_norm": 0.9381725661390383,
"learning_rate": 5.820612218873927e-06,
"loss": 0.1204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07469278573989868,
"step": 6675,
"valid_targets_mean": 1937.1,
"valid_targets_min": 744
},
{
"epoch": 5.435490435490435,
"grad_norm": 0.8330098856323024,
"learning_rate": 5.792023825292201e-06,
"loss": 0.1207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06777373701334,
"step": 6680,
"valid_targets_mean": 1842.2,
"valid_targets_min": 620
},
{
"epoch": 5.43956043956044,
"grad_norm": 0.8473418521641808,
"learning_rate": 5.763493919538154e-06,
"loss": 0.1161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06759806722402573,
"step": 6685,
"valid_targets_mean": 1637.6,
"valid_targets_min": 785
},
{
"epoch": 5.443630443630443,
"grad_norm": 0.8280879497111717,
"learning_rate": 5.735022619056521e-06,
"loss": 0.1206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06591871380805969,
"step": 6690,
"valid_targets_mean": 1969.9,
"valid_targets_min": 740
},
{
"epoch": 5.447700447700448,
"grad_norm": 0.8139854030624378,
"learning_rate": 5.706610041050806e-06,
"loss": 0.1152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05533464252948761,
"step": 6695,
"valid_targets_mean": 1432.1,
"valid_targets_min": 711
},
{
"epoch": 5.451770451770452,
"grad_norm": 0.8118262581872678,
"learning_rate": 5.678256302482772e-06,
"loss": 0.1224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06479828804731369,
"step": 6700,
"valid_targets_mean": 1695.6,
"valid_targets_min": 1122
},
{
"epoch": 5.455840455840455,
"grad_norm": 0.7908183689246445,
"learning_rate": 5.6499615200719735e-06,
"loss": 0.1174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06296779215335846,
"step": 6705,
"valid_targets_mean": 1524.5,
"valid_targets_min": 722
},
{
"epoch": 5.45991045991046,
"grad_norm": 0.8157309366372941,
"learning_rate": 5.621725810295264e-06,
"loss": 0.1128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05387778580188751,
"step": 6710,
"valid_targets_mean": 1289.2,
"valid_targets_min": 661
},
{
"epoch": 5.463980463980464,
"grad_norm": 0.7987860552011007,
"learning_rate": 5.593549289386315e-06,
"loss": 0.1107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055739592760801315,
"step": 6715,
"valid_targets_mean": 1519.5,
"valid_targets_min": 1011
},
{
"epoch": 5.4680504680504685,
"grad_norm": 0.8385843690819885,
"learning_rate": 5.565432073335153e-06,
"loss": 0.1237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0668364018201828,
"step": 6720,
"valid_targets_mean": 1731.4,
"valid_targets_min": 1277
},
{
"epoch": 5.472120472120472,
"grad_norm": 0.7910981905181974,
"learning_rate": 5.537374277887677e-06,
"loss": 0.1143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05977032706141472,
"step": 6725,
"valid_targets_mean": 1486.1,
"valid_targets_min": 807
},
{
"epoch": 5.476190476190476,
"grad_norm": 0.9696747865228715,
"learning_rate": 5.509376018545161e-06,
"loss": 0.1154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057927779853343964,
"step": 6730,
"valid_targets_mean": 1549.9,
"valid_targets_min": 679
},
{
"epoch": 5.480260480260481,
"grad_norm": 0.8421335406537752,
"learning_rate": 5.481437410563813e-06,
"loss": 0.1212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060152310878038406,
"step": 6735,
"valid_targets_mean": 1656.0,
"valid_targets_min": 1294
},
{
"epoch": 5.484330484330484,
"grad_norm": 0.7856036336209856,
"learning_rate": 5.4535585689542735e-06,
"loss": 0.118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.054788943380117416,
"step": 6740,
"valid_targets_mean": 1368.8,
"valid_targets_min": 790
},
{
"epoch": 5.488400488400488,
"grad_norm": 0.827864917037226,
"learning_rate": 5.4257396084811665e-06,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06671278178691864,
"step": 6745,
"valid_targets_mean": 1765.8,
"valid_targets_min": 592
},
{
"epoch": 5.492470492470493,
"grad_norm": 0.8303973263376846,
"learning_rate": 5.397980643662586e-06,
"loss": 0.1178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06511053442955017,
"step": 6750,
"valid_targets_mean": 1586.8,
"valid_targets_min": 662
},
{
"epoch": 5.496540496540496,
"grad_norm": 0.8780460301609091,
"learning_rate": 5.370281788769673e-06,
"loss": 0.1163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05283388867974281,
"step": 6755,
"valid_targets_mean": 1336.9,
"valid_targets_min": 622
},
{
"epoch": 5.500610500610501,
"grad_norm": 0.8240875330044186,
"learning_rate": 5.342643157826117e-06,
"loss": 0.1131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03851066157221794,
"step": 6760,
"valid_targets_mean": 1097.1,
"valid_targets_min": 625
},
{
"epoch": 5.504680504680505,
"grad_norm": 0.8739039631522074,
"learning_rate": 5.315064864607695e-06,
"loss": 0.1256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05119139701128006,
"step": 6765,
"valid_targets_mean": 1484.9,
"valid_targets_min": 888
},
{
"epoch": 5.508750508750508,
"grad_norm": 0.8003068896738135,
"learning_rate": 5.287547022641788e-06,
"loss": 0.1228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06188352033495903,
"step": 6770,
"valid_targets_mean": 1757.0,
"valid_targets_min": 635
},
{
"epoch": 5.512820512820513,
"grad_norm": 0.927599280836426,
"learning_rate": 5.260089745206942e-06,
"loss": 0.118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06444002687931061,
"step": 6775,
"valid_targets_mean": 1476.1,
"valid_targets_min": 522
},
{
"epoch": 5.516890516890517,
"grad_norm": 0.824485847569823,
"learning_rate": 5.232693145332379e-06,
"loss": 0.1168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04994414374232292,
"step": 6780,
"valid_targets_mean": 1230.9,
"valid_targets_min": 697
},
{
"epoch": 5.520960520960521,
"grad_norm": 0.8214091658820951,
"learning_rate": 5.205357335797545e-06,
"loss": 0.1103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06151646375656128,
"step": 6785,
"valid_targets_mean": 1671.0,
"valid_targets_min": 1010
},
{
"epoch": 5.525030525030525,
"grad_norm": 0.880824287835339,
"learning_rate": 5.178082429131628e-06,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055703192949295044,
"step": 6790,
"valid_targets_mean": 1411.0,
"valid_targets_min": 769
},
{
"epoch": 5.529100529100529,
"grad_norm": 0.8856311775898162,
"learning_rate": 5.150868537613114e-06,
"loss": 0.1171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04835759103298187,
"step": 6795,
"valid_targets_mean": 1298.6,
"valid_targets_min": 745
},
{
"epoch": 5.533170533170534,
"grad_norm": 0.8530843893172676,
"learning_rate": 5.123715773269318e-06,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043554842472076416,
"step": 6800,
"valid_targets_mean": 1118.9,
"valid_targets_min": 680
},
{
"epoch": 5.537240537240537,
"grad_norm": 0.8234954694495478,
"learning_rate": 5.096624247875925e-06,
"loss": 0.1146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07579924166202545,
"step": 6805,
"valid_targets_mean": 1905.9,
"valid_targets_min": 1347
},
{
"epoch": 5.5413105413105415,
"grad_norm": 0.9238596830777893,
"learning_rate": 5.069594072956512e-06,
"loss": 0.1211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08299441635608673,
"step": 6810,
"valid_targets_mean": 1636.0,
"valid_targets_min": 851
},
{
"epoch": 5.545380545380546,
"grad_norm": 0.8280105418368178,
"learning_rate": 5.042625359782118e-06,
"loss": 0.1138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04978195205330849,
"step": 6815,
"valid_targets_mean": 1457.2,
"valid_targets_min": 903
},
{
"epoch": 5.549450549450549,
"grad_norm": 0.8327669041192984,
"learning_rate": 5.015718219370775e-06,
"loss": 0.1146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06120377779006958,
"step": 6820,
"valid_targets_mean": 1674.4,
"valid_targets_min": 1240
},
{
"epoch": 5.553520553520554,
"grad_norm": 0.6091529761830878,
"learning_rate": 4.988872762487029e-06,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.047283854335546494,
"step": 6825,
"valid_targets_mean": 1697.1,
"valid_targets_min": 917
},
{
"epoch": 5.557590557590558,
"grad_norm": 0.7831969192018885,
"learning_rate": 4.962089099641518e-06,
"loss": 0.1051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05221349745988846,
"step": 6830,
"valid_targets_mean": 1580.9,
"valid_targets_min": 930
},
{
"epoch": 5.561660561660561,
"grad_norm": 0.784999322544449,
"learning_rate": 4.935367341090498e-06,
"loss": 0.1161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059659071266651154,
"step": 6835,
"valid_targets_mean": 1655.1,
"valid_targets_min": 1227
},
{
"epoch": 5.565730565730566,
"grad_norm": 0.8561304848098958,
"learning_rate": 4.908707596835396e-06,
"loss": 0.1101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05701415240764618,
"step": 6840,
"valid_targets_mean": 1565.8,
"valid_targets_min": 870
},
{
"epoch": 5.56980056980057,
"grad_norm": 0.8237448435276692,
"learning_rate": 4.882109976622353e-06,
"loss": 0.114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05764477699995041,
"step": 6845,
"valid_targets_mean": 1564.6,
"valid_targets_min": 822
},
{
"epoch": 5.573870573870574,
"grad_norm": 0.9077557622146745,
"learning_rate": 4.855574589941763e-06,
"loss": 0.1199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05498945713043213,
"step": 6850,
"valid_targets_mean": 1540.5,
"valid_targets_min": 1214
},
{
"epoch": 5.577940577940578,
"grad_norm": 0.8208304804405712,
"learning_rate": 4.829101546027843e-06,
"loss": 0.1097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05034732073545456,
"step": 6855,
"valid_targets_mean": 1268.6,
"valid_targets_min": 591
},
{
"epoch": 5.582010582010582,
"grad_norm": 0.8341724291260191,
"learning_rate": 4.80269095385818e-06,
"loss": 0.1156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045787129551172256,
"step": 6860,
"valid_targets_mean": 1232.5,
"valid_targets_min": 646
},
{
"epoch": 5.586080586080586,
"grad_norm": 0.6220953592726438,
"learning_rate": 4.776342922153252e-06,
"loss": 0.1074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04945782572031021,
"step": 6865,
"valid_targets_mean": 3032.8,
"valid_targets_min": 2115
},
{
"epoch": 5.59015059015059,
"grad_norm": 0.514602989750909,
"learning_rate": 4.750057559376027e-06,
"loss": 0.0989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03673814609646797,
"step": 6870,
"valid_targets_mean": 2553.1,
"valid_targets_min": 324
},
{
"epoch": 5.5942205942205945,
"grad_norm": 0.4451969667171798,
"learning_rate": 4.72383497373148e-06,
"loss": 0.0786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04091775789856911,
"step": 6875,
"valid_targets_mean": 2212.5,
"valid_targets_min": 982
},
{
"epoch": 5.598290598290598,
"grad_norm": 0.6233305674965636,
"learning_rate": 4.6976752731661755e-06,
"loss": 0.0736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042984090745449066,
"step": 6880,
"valid_targets_mean": 3619.4,
"valid_targets_min": 2479
},
{
"epoch": 5.602360602360602,
"grad_norm": 0.3301906624858536,
"learning_rate": 4.671578565367783e-06,
"loss": 0.0838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027935273945331573,
"step": 6885,
"valid_targets_mean": 3030.5,
"valid_targets_min": 811
},
{
"epoch": 5.606430606430607,
"grad_norm": 0.3998270887471306,
"learning_rate": 4.645544957764683e-06,
"loss": 0.0766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041048966348171234,
"step": 6890,
"valid_targets_mean": 2922.1,
"valid_targets_min": 1431
},
{
"epoch": 5.61050061050061,
"grad_norm": 0.7362755403982966,
"learning_rate": 4.619574557525497e-06,
"loss": 0.1112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09079274535179138,
"step": 6895,
"valid_targets_mean": 1991.0,
"valid_targets_min": 703
},
{
"epoch": 5.6145706145706145,
"grad_norm": 0.3819808054209917,
"learning_rate": 4.5936674715586335e-06,
"loss": 0.0923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045745231211185455,
"step": 6900,
"valid_targets_mean": 3251.1,
"valid_targets_min": 621
},
{
"epoch": 5.618640618640619,
"grad_norm": 0.4913669321147579,
"learning_rate": 4.567823806511882e-06,
"loss": 0.0844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0513700470328331,
"step": 6905,
"valid_targets_mean": 2681.1,
"valid_targets_min": 846
},
{
"epoch": 5.622710622710622,
"grad_norm": 0.46623010414455635,
"learning_rate": 4.542043668771956e-06,
"loss": 0.1154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05827459692955017,
"step": 6910,
"valid_targets_mean": 3618.6,
"valid_targets_min": 1369
},
{
"epoch": 5.626780626780627,
"grad_norm": 0.40350792589628737,
"learning_rate": 4.516327164464045e-06,
"loss": 0.0608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03749353438615799,
"step": 6915,
"valid_targets_mean": 2980.5,
"valid_targets_min": 754
},
{
"epoch": 5.630850630850631,
"grad_norm": 0.44644536414753183,
"learning_rate": 4.490674399451404e-06,
"loss": 0.0748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04275457561016083,
"step": 6920,
"valid_targets_mean": 2610.8,
"valid_targets_min": 776
},
{
"epoch": 5.634920634920634,
"grad_norm": 0.3716682275188854,
"learning_rate": 4.465085479334881e-06,
"loss": 0.0738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04192643612623215,
"step": 6925,
"valid_targets_mean": 3132.1,
"valid_targets_min": 754
},
{
"epoch": 5.638990638990639,
"grad_norm": 0.6737602005566654,
"learning_rate": 4.439560509452521e-06,
"loss": 0.1201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1757407784461975,
"step": 6930,
"valid_targets_mean": 2020.8,
"valid_targets_min": 664
},
{
"epoch": 5.643060643060643,
"grad_norm": 0.38494643743663376,
"learning_rate": 4.414099594879116e-06,
"loss": 0.0683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04006730392575264,
"step": 6935,
"valid_targets_mean": 3713.8,
"valid_targets_min": 2542
},
{
"epoch": 5.6471306471306475,
"grad_norm": 0.42182454234126665,
"learning_rate": 4.388702840425747e-06,
"loss": 0.0745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050172992050647736,
"step": 6940,
"valid_targets_mean": 3191.9,
"valid_targets_min": 1462
},
{
"epoch": 5.651200651200651,
"grad_norm": 0.42723433064009736,
"learning_rate": 4.363370350639405e-06,
"loss": 0.0672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045071978121995926,
"step": 6945,
"valid_targets_mean": 3721.0,
"valid_targets_min": 3281
},
{
"epoch": 5.655270655270655,
"grad_norm": 0.4697371582365796,
"learning_rate": 4.338102229802519e-06,
"loss": 0.0768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037965573370456696,
"step": 6950,
"valid_targets_mean": 3360.4,
"valid_targets_min": 2189
},
{
"epoch": 5.65934065934066,
"grad_norm": 0.3866243720482525,
"learning_rate": 4.312898581932543e-06,
"loss": 0.0754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033566609025001526,
"step": 6955,
"valid_targets_mean": 3223.9,
"valid_targets_min": 1590
},
{
"epoch": 5.663410663410663,
"grad_norm": 0.5221435785464758,
"learning_rate": 4.287759510781531e-06,
"loss": 0.0876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05182216316461563,
"step": 6960,
"valid_targets_mean": 2352.1,
"valid_targets_min": 597
},
{
"epoch": 5.6674806674806675,
"grad_norm": 0.4315745464727039,
"learning_rate": 4.262685119835681e-06,
"loss": 0.0824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04116567224264145,
"step": 6965,
"valid_targets_mean": 2612.9,
"valid_targets_min": 701
},
{
"epoch": 5.671550671550672,
"grad_norm": 0.5037919896206252,
"learning_rate": 4.237675512314963e-06,
"loss": 0.112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08254027366638184,
"step": 6970,
"valid_targets_mean": 2791.8,
"valid_targets_min": 1652
},
{
"epoch": 5.675620675620675,
"grad_norm": 0.37428492562737725,
"learning_rate": 4.212730791172637e-06,
"loss": 0.0828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030793912708759308,
"step": 6975,
"valid_targets_mean": 3704.5,
"valid_targets_min": 1908
},
{
"epoch": 5.67969067969068,
"grad_norm": 0.734812670763522,
"learning_rate": 4.1878510590948675e-06,
"loss": 0.0707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030109543353319168,
"step": 6980,
"valid_targets_mean": 3204.0,
"valid_targets_min": 842
},
{
"epoch": 5.683760683760684,
"grad_norm": 0.4553294615748584,
"learning_rate": 4.163036418500288e-06,
"loss": 0.1071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0399131178855896,
"step": 6985,
"valid_targets_mean": 3402.9,
"valid_targets_min": 2552
},
{
"epoch": 5.6878306878306875,
"grad_norm": 0.3690385553206738,
"learning_rate": 4.138286971539578e-06,
"loss": 0.0883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030925989151000977,
"step": 6990,
"valid_targets_mean": 2979.9,
"valid_targets_min": 753
},
{
"epoch": 5.691900691900692,
"grad_norm": 0.5807379632235751,
"learning_rate": 4.113602820095046e-06,
"loss": 0.0862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05012385547161102,
"step": 6995,
"valid_targets_mean": 1296.9,
"valid_targets_min": 568
},
{
"epoch": 5.695970695970696,
"grad_norm": 0.5547047028197435,
"learning_rate": 4.088984065780211e-06,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10247977077960968,
"step": 7000,
"valid_targets_mean": 3126.9,
"valid_targets_min": 1070
},
{
"epoch": 5.7000407000407005,
"grad_norm": 0.5537368442018135,
"learning_rate": 4.064430809939366e-06,
"loss": 0.0833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041642434895038605,
"step": 7005,
"valid_targets_mean": 2456.6,
"valid_targets_min": 329
},
{
"epoch": 5.704110704110704,
"grad_norm": 0.6592126673581086,
"learning_rate": 4.039943153647199e-06,
"loss": 0.0868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04998764768242836,
"step": 7010,
"valid_targets_mean": 1027.8,
"valid_targets_min": 608
},
{
"epoch": 5.708180708180708,
"grad_norm": 0.460024733008231,
"learning_rate": 4.015521197708332e-06,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048872776329517365,
"step": 7015,
"valid_targets_mean": 4479.8,
"valid_targets_min": 2772
},
{
"epoch": 5.712250712250713,
"grad_norm": 0.27240175134306893,
"learning_rate": 3.9911650426569435e-06,
"loss": 0.0681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022211387753486633,
"step": 7020,
"valid_targets_mean": 4843.0,
"valid_targets_min": 3778
},
{
"epoch": 5.716320716320716,
"grad_norm": 0.679333960574683,
"learning_rate": 3.966874788756334e-06,
"loss": 0.0857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03754306584596634,
"step": 7025,
"valid_targets_mean": 4306.0,
"valid_targets_min": 2336
},
{
"epoch": 5.7203907203907205,
"grad_norm": 0.4459001490448593,
"learning_rate": 3.942650535998524e-06,
"loss": 0.0806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04726475849747658,
"step": 7030,
"valid_targets_mean": 3579.5,
"valid_targets_min": 846
},
{
"epoch": 5.724460724460725,
"grad_norm": 0.44157380368224075,
"learning_rate": 3.9184923841038295e-06,
"loss": 0.0716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04266761243343353,
"step": 7035,
"valid_targets_mean": 2909.1,
"valid_targets_min": 798
},
{
"epoch": 5.728530728530728,
"grad_norm": 0.4449017607427598,
"learning_rate": 3.894400432520469e-06,
"loss": 0.0689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02835097163915634,
"step": 7040,
"valid_targets_mean": 2008.5,
"valid_targets_min": 533
},
{
"epoch": 5.732600732600733,
"grad_norm": 0.4703351541184157,
"learning_rate": 3.870374780424131e-06,
"loss": 0.0723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03980240598320961,
"step": 7045,
"valid_targets_mean": 2598.2,
"valid_targets_min": 833
},
{
"epoch": 5.736670736670737,
"grad_norm": 0.3551380809469693,
"learning_rate": 3.846415526717582e-06,
"loss": 0.0685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0330246202647686,
"step": 7050,
"valid_targets_mean": 4031.8,
"valid_targets_min": 3391
},
{
"epoch": 5.7407407407407405,
"grad_norm": 0.5831858604258909,
"learning_rate": 3.8225227700302616e-06,
"loss": 0.0848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10323013365268707,
"step": 7055,
"valid_targets_mean": 1909.9,
"valid_targets_min": 732
},
{
"epoch": 5.744810744810745,
"grad_norm": 0.5066452107972234,
"learning_rate": 3.7986966087178733e-06,
"loss": 0.0908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03759615123271942,
"step": 7060,
"valid_targets_mean": 1908.9,
"valid_targets_min": 538
},
{
"epoch": 5.748880748880749,
"grad_norm": 0.528867423320594,
"learning_rate": 3.7749371408619718e-06,
"loss": 0.0595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032433267682790756,
"step": 7065,
"valid_targets_mean": 824.9,
"valid_targets_min": 720
},
{
"epoch": 5.752950752950753,
"grad_norm": 0.41003167533389645,
"learning_rate": 3.751244464269568e-06,
"loss": 0.0647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0331251323223114,
"step": 7070,
"valid_targets_mean": 3181.1,
"valid_targets_min": 2328
},
{
"epoch": 5.757020757020757,
"grad_norm": 0.48249588908464164,
"learning_rate": 3.727618676472724e-06,
"loss": 0.0628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028061306104063988,
"step": 7075,
"valid_targets_mean": 2581.4,
"valid_targets_min": 684
},
{
"epoch": 5.761090761090761,
"grad_norm": 0.444459931043437,
"learning_rate": 3.704059874728141e-06,
"loss": 0.1082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04039149731397629,
"step": 7080,
"valid_targets_mean": 3461.2,
"valid_targets_min": 2795
},
{
"epoch": 5.765160765160765,
"grad_norm": 0.43861111289426047,
"learning_rate": 3.680568156016786e-06,
"loss": 0.0816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0352468304336071,
"step": 7085,
"valid_targets_mean": 3382.6,
"valid_targets_min": 744
},
{
"epoch": 5.769230769230769,
"grad_norm": 0.3633878194360417,
"learning_rate": 3.6571436170434547e-06,
"loss": 0.0859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02400396391749382,
"step": 7090,
"valid_targets_mean": 3966.6,
"valid_targets_min": 3279
},
{
"epoch": 5.7733007733007735,
"grad_norm": 0.6690219140055973,
"learning_rate": 3.633786354236415e-06,
"loss": 0.0817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035930804908275604,
"step": 7095,
"valid_targets_mean": 792.1,
"valid_targets_min": 536
},
{
"epoch": 5.777370777370777,
"grad_norm": 0.6422113838762212,
"learning_rate": 3.6104964637469755e-06,
"loss": 0.1166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04105771332979202,
"step": 7100,
"valid_targets_mean": 2227.4,
"valid_targets_min": 853
},
{
"epoch": 5.781440781440781,
"grad_norm": 0.4559712074457705,
"learning_rate": 3.5872740414491093e-06,
"loss": 0.0771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04004089534282684,
"step": 7105,
"valid_targets_mean": 3105.6,
"valid_targets_min": 2621
},
{
"epoch": 5.785510785510786,
"grad_norm": 0.6237273326303014,
"learning_rate": 3.564119182939052e-06,
"loss": 0.1027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04093822091817856,
"step": 7110,
"valid_targets_mean": 1028.0,
"valid_targets_min": 728
},
{
"epoch": 5.789580789580789,
"grad_norm": 0.5635603145419109,
"learning_rate": 3.541031983534915e-06,
"loss": 0.0706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04176001995801926,
"step": 7115,
"valid_targets_mean": 1574.2,
"valid_targets_min": 618
},
{
"epoch": 5.7936507936507935,
"grad_norm": 0.36319222074079344,
"learning_rate": 3.5180125382762674e-06,
"loss": 0.0744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042091649025678635,
"step": 7120,
"valid_targets_mean": 4135.0,
"valid_targets_min": 907
},
{
"epoch": 5.797720797720798,
"grad_norm": 0.6553513990147538,
"learning_rate": 3.4950609419237956e-06,
"loss": 0.0831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0537349097430706,
"step": 7125,
"valid_targets_mean": 3060.8,
"valid_targets_min": 580
},
{
"epoch": 5.801790801790801,
"grad_norm": 0.3897873956243497,
"learning_rate": 3.4721772889588533e-06,
"loss": 0.0642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031878359615802765,
"step": 7130,
"valid_targets_mean": 3413.8,
"valid_targets_min": 726
},
{
"epoch": 5.805860805860806,
"grad_norm": 0.7307214688735437,
"learning_rate": 3.4493616735831205e-06,
"loss": 0.0627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0403984859585762,
"step": 7135,
"valid_targets_mean": 4560.9,
"valid_targets_min": 2613
},
{
"epoch": 5.80993080993081,
"grad_norm": 0.4526517648913433,
"learning_rate": 3.4266141897181917e-06,
"loss": 0.0721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04063914343714714,
"step": 7140,
"valid_targets_mean": 2847.2,
"valid_targets_min": 531
},
{
"epoch": 5.814000814000814,
"grad_norm": 0.48774825169971975,
"learning_rate": 3.4039349310051973e-06,
"loss": 0.0897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035396378487348557,
"step": 7145,
"valid_targets_mean": 2571.5,
"valid_targets_min": 826
},
{
"epoch": 5.818070818070818,
"grad_norm": 0.4021017225060565,
"learning_rate": 3.3813239908044104e-06,
"loss": 0.085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034908998757600784,
"step": 7150,
"valid_targets_mean": 3709.6,
"valid_targets_min": 3024
},
{
"epoch": 5.822140822140822,
"grad_norm": 0.3908988537537165,
"learning_rate": 3.358781462194878e-06,
"loss": 0.0733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0368090383708477,
"step": 7155,
"valid_targets_mean": 3559.0,
"valid_targets_min": 2588
},
{
"epoch": 5.8262108262108265,
"grad_norm": 0.5606060832836967,
"learning_rate": 3.336307437974011e-06,
"loss": 0.0756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05241452157497406,
"step": 7160,
"valid_targets_mean": 913.9,
"valid_targets_min": 502
},
{
"epoch": 5.83028083028083,
"grad_norm": 0.44223267919961007,
"learning_rate": 3.313902010657226e-06,
"loss": 0.08,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032404445111751556,
"step": 7165,
"valid_targets_mean": 3301.9,
"valid_targets_min": 1158
},
{
"epoch": 5.834350834350834,
"grad_norm": 0.3154823634128118,
"learning_rate": 3.2915652724775616e-06,
"loss": 0.0588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027957221493124962,
"step": 7170,
"valid_targets_mean": 3874.9,
"valid_targets_min": 3044
},
{
"epoch": 5.838420838420839,
"grad_norm": 0.4259827920303877,
"learning_rate": 3.2692973153852936e-06,
"loss": 0.0792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03220093250274658,
"step": 7175,
"valid_targets_mean": 2167.8,
"valid_targets_min": 539
},
{
"epoch": 5.842490842490842,
"grad_norm": 0.42833294388406135,
"learning_rate": 3.247098231047552e-06,
"loss": 0.0734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03128783777356148,
"step": 7180,
"valid_targets_mean": 2397.0,
"valid_targets_min": 387
},
{
"epoch": 5.8465608465608465,
"grad_norm": 0.5739666740538348,
"learning_rate": 3.22496811084795e-06,
"loss": 0.0823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04366585612297058,
"step": 7185,
"valid_targets_mean": 2340.9,
"valid_targets_min": 872
},
{
"epoch": 5.850630850630851,
"grad_norm": 0.41911962257836954,
"learning_rate": 3.2029070458862145e-06,
"loss": 0.0763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0234956294298172,
"step": 7190,
"valid_targets_mean": 3017.2,
"valid_targets_min": 822
},
{
"epoch": 5.854700854700854,
"grad_norm": 0.7353086790754305,
"learning_rate": 3.180915126977795e-06,
"loss": 0.0796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05614851415157318,
"step": 7195,
"valid_targets_mean": 1405.9,
"valid_targets_min": 605
},
{
"epoch": 5.858770858770859,
"grad_norm": 0.4594492349495658,
"learning_rate": 3.158992444653497e-06,
"loss": 0.0707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043180473148822784,
"step": 7200,
"valid_targets_mean": 2249.2,
"valid_targets_min": 808
},
{
"epoch": 5.862840862840863,
"grad_norm": 0.41266900678804913,
"learning_rate": 3.137139089159109e-06,
"loss": 0.0917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035402562469244,
"step": 7205,
"valid_targets_mean": 2900.5,
"valid_targets_min": 1010
},
{
"epoch": 5.866910866910867,
"grad_norm": 0.41094688449906835,
"learning_rate": 3.1153551504550397e-06,
"loss": 0.0711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02497289329767227,
"step": 7210,
"valid_targets_mean": 2432.6,
"valid_targets_min": 524
},
{
"epoch": 5.870980870980871,
"grad_norm": 0.47665813139114804,
"learning_rate": 3.0936407182159333e-06,
"loss": 0.0659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02819974161684513,
"step": 7215,
"valid_targets_mean": 1303.5,
"valid_targets_min": 516
},
{
"epoch": 5.875050875050875,
"grad_norm": 0.5054406457987558,
"learning_rate": 3.0719958818303165e-06,
"loss": 0.0841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032017797231674194,
"step": 7220,
"valid_targets_mean": 1762.1,
"valid_targets_min": 342
},
{
"epoch": 5.8791208791208796,
"grad_norm": 0.39611619386986135,
"learning_rate": 3.050420730400212e-06,
"loss": 0.0782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03306104242801666,
"step": 7225,
"valid_targets_mean": 3301.8,
"valid_targets_min": 1440
},
{
"epoch": 5.883190883190883,
"grad_norm": 0.44746690647319465,
"learning_rate": 3.0289153527407842e-06,
"loss": 0.0613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031408607959747314,
"step": 7230,
"valid_targets_mean": 2274.2,
"valid_targets_min": 708
},
{
"epoch": 5.887260887260887,
"grad_norm": 0.3541822938829694,
"learning_rate": 3.007479837379974e-06,
"loss": 0.0713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030303731560707092,
"step": 7235,
"valid_targets_mean": 5103.1,
"valid_targets_min": 3653
},
{
"epoch": 5.891330891330892,
"grad_norm": 0.35916098515876993,
"learning_rate": 2.9861142725581225e-06,
"loss": 0.068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02420351281762123,
"step": 7240,
"valid_targets_mean": 2366.5,
"valid_targets_min": 684
},
{
"epoch": 5.895400895400895,
"grad_norm": 0.3952741270339185,
"learning_rate": 2.96481874622762e-06,
"loss": 0.0586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034595150500535965,
"step": 7245,
"valid_targets_mean": 3352.1,
"valid_targets_min": 726
},
{
"epoch": 5.8994708994708995,
"grad_norm": 0.33735128445439605,
"learning_rate": 2.94359334605254e-06,
"loss": 0.082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03757286071777344,
"step": 7250,
"valid_targets_mean": 4009.6,
"valid_targets_min": 3076
},
{
"epoch": 5.903540903540904,
"grad_norm": 0.5708917806995089,
"learning_rate": 2.9224381594082807e-06,
"loss": 0.0917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14005272090435028,
"step": 7255,
"valid_targets_mean": 2811.9,
"valid_targets_min": 1536
},
{
"epoch": 5.907610907610907,
"grad_norm": 0.39275014659707425,
"learning_rate": 2.9013532733812e-06,
"loss": 0.0702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03683479502797127,
"step": 7260,
"valid_targets_mean": 2669.4,
"valid_targets_min": 582
},
{
"epoch": 5.911680911680912,
"grad_norm": 0.34548880597408943,
"learning_rate": 2.880338774768263e-06,
"loss": 0.0819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025920607149600983,
"step": 7265,
"valid_targets_mean": 3261.9,
"valid_targets_min": 633
},
{
"epoch": 5.915750915750916,
"grad_norm": 0.37519369539071246,
"learning_rate": 2.8593947500766805e-06,
"loss": 0.0921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02501959726214409,
"step": 7270,
"valid_targets_mean": 3287.2,
"valid_targets_min": 1130
},
{
"epoch": 5.9198209198209195,
"grad_norm": 0.5057331987244915,
"learning_rate": 2.8385212855235477e-06,
"loss": 0.0668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03711901605129242,
"step": 7275,
"valid_targets_mean": 2858.9,
"valid_targets_min": 492
},
{
"epoch": 5.923890923890924,
"grad_norm": 0.5218986162294897,
"learning_rate": 2.8177184670355063e-06,
"loss": 0.0741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04017069190740585,
"step": 7280,
"valid_targets_mean": 2531.5,
"valid_targets_min": 1045
},
{
"epoch": 5.927960927960928,
"grad_norm": 0.40603198794295736,
"learning_rate": 2.7969863802483676e-06,
"loss": 0.0666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023707497864961624,
"step": 7285,
"valid_targets_mean": 2692.0,
"valid_targets_min": 647
},
{
"epoch": 5.932030932030932,
"grad_norm": 0.61945163833617,
"learning_rate": 2.7763251105067813e-06,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09058065712451935,
"step": 7290,
"valid_targets_mean": 1831.5,
"valid_targets_min": 806
},
{
"epoch": 5.936100936100936,
"grad_norm": 0.5987985070511739,
"learning_rate": 2.755734742863876e-06,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.036716535687446594,
"step": 7295,
"valid_targets_mean": 1300.1,
"valid_targets_min": 575
},
{
"epoch": 5.94017094017094,
"grad_norm": 0.4345655736128064,
"learning_rate": 2.7352153620809053e-06,
"loss": 0.0704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03189973905682564,
"step": 7300,
"valid_targets_mean": 3615.9,
"valid_targets_min": 3193
},
{
"epoch": 5.944240944240944,
"grad_norm": 0.3798658377694568,
"learning_rate": 2.7147670526268986e-06,
"loss": 0.0699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02867596037685871,
"step": 7305,
"valid_targets_mean": 3944.1,
"valid_targets_min": 3433
},
{
"epoch": 5.948310948310948,
"grad_norm": 0.4038694045993181,
"learning_rate": 2.694389898678327e-06,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027545157819986343,
"step": 7310,
"valid_targets_mean": 2874.5,
"valid_targets_min": 767
},
{
"epoch": 5.9523809523809526,
"grad_norm": 0.4462098257681364,
"learning_rate": 2.674083984118736e-06,
"loss": 0.0641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02901633456349373,
"step": 7315,
"valid_targets_mean": 2262.1,
"valid_targets_min": 785
},
{
"epoch": 5.956450956450956,
"grad_norm": 0.7941447901126528,
"learning_rate": 2.65384939253841e-06,
"loss": 0.0865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04680174961686134,
"step": 7320,
"valid_targets_mean": 1222.8,
"valid_targets_min": 758
},
{
"epoch": 5.96052096052096,
"grad_norm": 0.6008702314886109,
"learning_rate": 2.6336862072340343e-06,
"loss": 0.0624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03380628675222397,
"step": 7325,
"valid_targets_mean": 2184.0,
"valid_targets_min": 797
},
{
"epoch": 5.964590964590965,
"grad_norm": 0.40310929667447126,
"learning_rate": 2.6135945112083506e-06,
"loss": 0.0677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031311824917793274,
"step": 7330,
"valid_targets_mean": 3445.0,
"valid_targets_min": 1606
},
{
"epoch": 5.968660968660968,
"grad_norm": 0.5761031593235989,
"learning_rate": 2.593574387169804e-06,
"loss": 0.0682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039855875074863434,
"step": 7335,
"valid_targets_mean": 2760.0,
"valid_targets_min": 678
},
{
"epoch": 5.9727309727309725,
"grad_norm": 0.3635293145604907,
"learning_rate": 2.573625917532212e-06,
"loss": 0.0731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035828523337841034,
"step": 7340,
"valid_targets_mean": 5550.0,
"valid_targets_min": 3997
},
{
"epoch": 5.976800976800977,
"grad_norm": 0.39688144504385575,
"learning_rate": 2.553749184414429e-06,
"loss": 0.0649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02166413888335228,
"step": 7345,
"valid_targets_mean": 2142.1,
"valid_targets_min": 706
},
{
"epoch": 5.980870980870981,
"grad_norm": 0.6218812931078816,
"learning_rate": 2.5339442696399897e-06,
"loss": 0.0713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04698009043931961,
"step": 7350,
"valid_targets_mean": 1705.0,
"valid_targets_min": 580
},
{
"epoch": 5.984940984940985,
"grad_norm": 0.6040764860465824,
"learning_rate": 2.5142112547368005e-06,
"loss": 0.0932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0763426423072815,
"step": 7355,
"valid_targets_mean": 2792.0,
"valid_targets_min": 2379
},
{
"epoch": 5.989010989010989,
"grad_norm": 0.37158486023146986,
"learning_rate": 2.494550220936773e-06,
"loss": 0.1331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033909812569618225,
"step": 7360,
"valid_targets_mean": 3489.0,
"valid_targets_min": 2861
},
{
"epoch": 5.993080993080993,
"grad_norm": 0.39704045184452585,
"learning_rate": 2.4749612491755158e-06,
"loss": 0.0711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03327007219195366,
"step": 7365,
"valid_targets_mean": 3850.4,
"valid_targets_min": 2453
},
{
"epoch": 5.997150997150997,
"grad_norm": 0.3981496985616391,
"learning_rate": 2.4554444200919882e-06,
"loss": 0.0662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03435596078634262,
"step": 7370,
"valid_targets_mean": 3932.9,
"valid_targets_min": 3389
},
{
"epoch": 6.0008140008140005,
"grad_norm": 0.9799010644276512,
"learning_rate": 2.4359998140281715e-06,
"loss": 0.1184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09912261366844177,
"step": 7375,
"valid_targets_mean": 8215.2,
"valid_targets_min": 6163
},
{
"epoch": 6.004884004884005,
"grad_norm": 0.958774868683029,
"learning_rate": 2.416627511028733e-06,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10130266845226288,
"step": 7380,
"valid_targets_mean": 8594.4,
"valid_targets_min": 6006
},
{
"epoch": 6.008954008954009,
"grad_norm": 0.7944310104614162,
"learning_rate": 2.39732759084071e-06,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07904568314552307,
"step": 7385,
"valid_targets_mean": 3578.4,
"valid_targets_min": 289
},
{
"epoch": 6.013024013024013,
"grad_norm": 0.6679727135866469,
"learning_rate": 2.3781001329131593e-06,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08894851803779602,
"step": 7390,
"valid_targets_mean": 7019.9,
"valid_targets_min": 4985
},
{
"epoch": 6.017094017094017,
"grad_norm": 0.5487601824765074,
"learning_rate": 2.358945216396855e-06,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08587461709976196,
"step": 7395,
"valid_targets_mean": 6956.6,
"valid_targets_min": 1457
},
{
"epoch": 6.021164021164021,
"grad_norm": 0.4456534450702924,
"learning_rate": 2.3398629201439427e-06,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08091467618942261,
"step": 7400,
"valid_targets_mean": 7361.6,
"valid_targets_min": 4961
},
{
"epoch": 6.025234025234025,
"grad_norm": 0.49514854465976493,
"learning_rate": 2.3208533227076257e-06,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10835494101047516,
"step": 7405,
"valid_targets_mean": 7058.5,
"valid_targets_min": 5985
},
{
"epoch": 6.029304029304029,
"grad_norm": 0.43486218825382905,
"learning_rate": 2.3019165023418433e-06,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09653938561677933,
"step": 7410,
"valid_targets_mean": 7664.2,
"valid_targets_min": 5169
},
{
"epoch": 6.0333740333740336,
"grad_norm": 0.4375911545615398,
"learning_rate": 2.2830525370009405e-06,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08376707136631012,
"step": 7415,
"valid_targets_mean": 7111.8,
"valid_targets_min": 5348
},
{
"epoch": 6.037444037444037,
"grad_norm": 0.48136548478281455,
"learning_rate": 2.2642615043393512e-06,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07133744657039642,
"step": 7420,
"valid_targets_mean": 4238.9,
"valid_targets_min": 152
},
{
"epoch": 6.041514041514041,
"grad_norm": 0.4381144318946382,
"learning_rate": 2.2455434817112853e-06,
"loss": 0.1572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08667995780706406,
"step": 7425,
"valid_targets_mean": 7199.4,
"valid_targets_min": 4258
},
{
"epoch": 6.045584045584046,
"grad_norm": 0.4042301802869176,
"learning_rate": 2.226898546170384e-06,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08247347176074982,
"step": 7430,
"valid_targets_mean": 7243.4,
"valid_targets_min": 5831
},
{
"epoch": 6.04965404965405,
"grad_norm": 0.401406369618756,
"learning_rate": 2.2083267744694494e-06,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08167104423046112,
"step": 7435,
"valid_targets_mean": 6950.6,
"valid_targets_min": 3862
},
{
"epoch": 6.0537240537240535,
"grad_norm": 0.3945925382036933,
"learning_rate": 2.1898282430600727e-06,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08647415041923523,
"step": 7440,
"valid_targets_mean": 6991.9,
"valid_targets_min": 5696
},
{
"epoch": 6.057794057794058,
"grad_norm": 0.42315972384850226,
"learning_rate": 2.171403028092367e-06,
"loss": 0.1573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0863867774605751,
"step": 7445,
"valid_targets_mean": 6963.5,
"valid_targets_min": 4947
},
{
"epoch": 6.061864061864062,
"grad_norm": 0.39104627702301664,
"learning_rate": 2.153051205414631e-06,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07545962929725647,
"step": 7450,
"valid_targets_mean": 6436.9,
"valid_targets_min": 4988
},
{
"epoch": 6.065934065934066,
"grad_norm": 0.4009252559269369,
"learning_rate": 2.1347728505730392e-06,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07987205684185028,
"step": 7455,
"valid_targets_mean": 7518.0,
"valid_targets_min": 5476
},
{
"epoch": 6.07000407000407,
"grad_norm": 0.380485131548382,
"learning_rate": 2.116568038811333e-06,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07481364905834198,
"step": 7460,
"valid_targets_mean": 7422.6,
"valid_targets_min": 5226
},
{
"epoch": 6.074074074074074,
"grad_norm": 0.4378435227613099,
"learning_rate": 2.098436845070504e-06,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10386194288730621,
"step": 7465,
"valid_targets_mean": 7080.0,
"valid_targets_min": 3753
},
{
"epoch": 6.078144078144078,
"grad_norm": 0.4804949566456428,
"learning_rate": 2.080379343988497e-06,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.093023382127285,
"step": 7470,
"valid_targets_mean": 6064.6,
"valid_targets_min": 5161
},
{
"epoch": 6.082214082214082,
"grad_norm": 0.40760982947259294,
"learning_rate": 2.0623956098999056e-06,
"loss": 0.1285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07654588669538498,
"step": 7475,
"valid_targets_mean": 7388.1,
"valid_targets_min": 5795
},
{
"epoch": 6.086284086284087,
"grad_norm": 0.3959750946787557,
"learning_rate": 2.044485716835638e-06,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07424226403236389,
"step": 7480,
"valid_targets_mean": 7696.0,
"valid_targets_min": 4658
},
{
"epoch": 6.09035409035409,
"grad_norm": 0.40969800106923865,
"learning_rate": 2.026649738522648e-06,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08557029068470001,
"step": 7485,
"valid_targets_mean": 7799.1,
"valid_targets_min": 5508
},
{
"epoch": 6.094424094424094,
"grad_norm": 0.4322454122605302,
"learning_rate": 2.00888774838361e-06,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08102475851774216,
"step": 7490,
"valid_targets_mean": 7341.6,
"valid_targets_min": 6454
},
{
"epoch": 6.098494098494099,
"grad_norm": 0.4243940059827788,
"learning_rate": 1.9911998195366267e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07009638100862503,
"step": 7495,
"valid_targets_mean": 6818.0,
"valid_targets_min": 4392
},
{
"epoch": 6.102564102564102,
"grad_norm": 0.3901538287752902,
"learning_rate": 1.9735860247949245e-06,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07060252130031586,
"step": 7500,
"valid_targets_mean": 7857.6,
"valid_targets_min": 5394
},
{
"epoch": 6.1066341066341066,
"grad_norm": 0.3579631569965471,
"learning_rate": 1.956046436666539e-06,
"loss": 0.1407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06699617207050323,
"step": 7505,
"valid_targets_mean": 8314.1,
"valid_targets_min": 4837
},
{
"epoch": 6.110704110704111,
"grad_norm": 0.3428888972719672,
"learning_rate": 1.938581127354049e-06,
"loss": 0.1402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05949755012989044,
"step": 7510,
"valid_targets_mean": 7368.2,
"valid_targets_min": 6027
},
{
"epoch": 6.114774114774114,
"grad_norm": 0.435155549282921,
"learning_rate": 1.92119016875425e-06,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07999107986688614,
"step": 7515,
"valid_targets_mean": 6435.0,
"valid_targets_min": 4238
},
{
"epoch": 6.118844118844119,
"grad_norm": 1.1395430138108782,
"learning_rate": 1.903873632457871e-06,
"loss": 0.1424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03771523758769035,
"step": 7520,
"valid_targets_mean": 247.8,
"valid_targets_min": 137
},
{
"epoch": 6.122914122914123,
"grad_norm": 0.4163271285571281,
"learning_rate": 1.8866315897492792e-06,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07711055874824524,
"step": 7525,
"valid_targets_mean": 6807.0,
"valid_targets_min": 5165
},
{
"epoch": 6.1269841269841265,
"grad_norm": 0.4805973336300679,
"learning_rate": 1.8694641116061895e-06,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08931201696395874,
"step": 7530,
"valid_targets_mean": 6989.9,
"valid_targets_min": 5104
},
{
"epoch": 6.131054131054131,
"grad_norm": 0.48380408719281154,
"learning_rate": 1.8523712686993644e-06,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09077896177768707,
"step": 7535,
"valid_targets_mean": 6692.2,
"valid_targets_min": 5068
},
{
"epoch": 6.135124135124135,
"grad_norm": 0.4478468576523544,
"learning_rate": 1.8353531313923213e-06,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09867697954177856,
"step": 7540,
"valid_targets_mean": 7419.6,
"valid_targets_min": 5578
},
{
"epoch": 6.13919413919414,
"grad_norm": 0.41186611739704415,
"learning_rate": 1.818409769741054e-06,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08206415176391602,
"step": 7545,
"valid_targets_mean": 7536.5,
"valid_targets_min": 5075
},
{
"epoch": 6.143264143264143,
"grad_norm": 0.3768181446141734,
"learning_rate": 1.8015412534937438e-06,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07646715641021729,
"step": 7550,
"valid_targets_mean": 7221.5,
"valid_targets_min": 5841
},
{
"epoch": 6.147334147334147,
"grad_norm": 0.38647441084901085,
"learning_rate": 1.7847476520904528e-06,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07809443771839142,
"step": 7555,
"valid_targets_mean": 7287.5,
"valid_targets_min": 5151
},
{
"epoch": 6.151404151404152,
"grad_norm": 0.40816468239190296,
"learning_rate": 1.7680290346628659e-06,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0784003883600235,
"step": 7560,
"valid_targets_mean": 6738.4,
"valid_targets_min": 4042
},
{
"epoch": 6.155474155474155,
"grad_norm": 0.4323305496400144,
"learning_rate": 1.7513854700339884e-06,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08970016241073608,
"step": 7565,
"valid_targets_mean": 6331.0,
"valid_targets_min": 5496
},
{
"epoch": 6.15954415954416,
"grad_norm": 0.43997280921953213,
"learning_rate": 1.7348170267178655e-06,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07909651845693588,
"step": 7570,
"valid_targets_mean": 6271.1,
"valid_targets_min": 4695
},
{
"epoch": 6.163614163614164,
"grad_norm": 0.4492944206042751,
"learning_rate": 1.7183237729193081e-06,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08394847810268402,
"step": 7575,
"valid_targets_mean": 5790.8,
"valid_targets_min": 5021
},
{
"epoch": 6.167684167684167,
"grad_norm": 0.4731995030501333,
"learning_rate": 1.7019057765335945e-06,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0583474338054657,
"step": 7580,
"valid_targets_mean": 3386.8,
"valid_targets_min": 2279
},
{
"epoch": 6.171754171754172,
"grad_norm": 0.4167788460938727,
"learning_rate": 1.6855631051462084e-06,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0789489597082138,
"step": 7585,
"valid_targets_mean": 6240.5,
"valid_targets_min": 5093
},
{
"epoch": 6.175824175824176,
"grad_norm": 0.43712455668316696,
"learning_rate": 1.6692958260325599e-06,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08045420050621033,
"step": 7590,
"valid_targets_mean": 6329.5,
"valid_targets_min": 4589
},
{
"epoch": 6.1798941798941796,
"grad_norm": 0.402788614634297,
"learning_rate": 1.6531040061576909e-06,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08553263545036316,
"step": 7595,
"valid_targets_mean": 7589.2,
"valid_targets_min": 4963
},
{
"epoch": 6.183964183964184,
"grad_norm": 0.41963035365571566,
"learning_rate": 1.6369877121760237e-06,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06892232596874237,
"step": 7600,
"valid_targets_mean": 5577.9,
"valid_targets_min": 4458
},
{
"epoch": 6.188034188034188,
"grad_norm": 0.45017103457098034,
"learning_rate": 1.6209470104310666e-06,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0763903558254242,
"step": 7605,
"valid_targets_mean": 5432.5,
"valid_targets_min": 4433
},
{
"epoch": 6.192104192104192,
"grad_norm": 0.4536922039185944,
"learning_rate": 1.604981966955157e-06,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08348037302494049,
"step": 7610,
"valid_targets_mean": 6361.8,
"valid_targets_min": 5201
},
{
"epoch": 6.196174196174196,
"grad_norm": 0.4307255875359923,
"learning_rate": 1.5890926474691682e-06,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07572345435619354,
"step": 7615,
"valid_targets_mean": 5824.4,
"valid_targets_min": 5129
},
{
"epoch": 6.2002442002442,
"grad_norm": 0.7193073806157995,
"learning_rate": 1.5732791173822626e-06,
"loss": 0.1234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0709250420331955,
"step": 7620,
"valid_targets_mean": 1637.6,
"valid_targets_min": 137
},
{
"epoch": 6.204314204314204,
"grad_norm": 0.418121085820752,
"learning_rate": 1.55754144179161e-06,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07970662415027618,
"step": 7625,
"valid_targets_mean": 6474.6,
"valid_targets_min": 4751
},
{
"epoch": 6.208384208384208,
"grad_norm": 0.41818652414348384,
"learning_rate": 1.5418796854821239e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08583327382802963,
"step": 7630,
"valid_targets_mean": 7186.2,
"valid_targets_min": 5358
},
{
"epoch": 6.212454212454213,
"grad_norm": 0.4079409474648988,
"learning_rate": 1.52629391292618e-06,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08047682046890259,
"step": 7635,
"valid_targets_mean": 7126.8,
"valid_targets_min": 4078
},
{
"epoch": 6.216524216524217,
"grad_norm": 0.41113059492418275,
"learning_rate": 1.5107841882833785e-06,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07577785849571228,
"step": 7640,
"valid_targets_mean": 7022.1,
"valid_targets_min": 4940
},
{
"epoch": 6.22059422059422,
"grad_norm": 0.4280680246313017,
"learning_rate": 1.4953505754002562e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08161963522434235,
"step": 7645,
"valid_targets_mean": 5900.6,
"valid_targets_min": 4779
},
{
"epoch": 6.224664224664225,
"grad_norm": 0.40255377466943804,
"learning_rate": 1.4799931378100386e-06,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08172336220741272,
"step": 7650,
"valid_targets_mean": 6290.1,
"valid_targets_min": 4620
},
{
"epoch": 6.228734228734229,
"grad_norm": 0.8420012750324607,
"learning_rate": 1.4647119387323593e-06,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05620827525854111,
"step": 7655,
"valid_targets_mean": 1162.2,
"valid_targets_min": 788
},
{
"epoch": 6.232804232804233,
"grad_norm": 0.8176601544559853,
"learning_rate": 1.4495070410730238e-06,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06722263246774673,
"step": 7660,
"valid_targets_mean": 1500.6,
"valid_targets_min": 957
},
{
"epoch": 6.236874236874237,
"grad_norm": 0.7199859456501606,
"learning_rate": 1.4343785074237393e-06,
"loss": 0.1284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05805957317352295,
"step": 7665,
"valid_targets_mean": 1371.2,
"valid_targets_min": 796
},
{
"epoch": 6.240944240944241,
"grad_norm": 0.8078058347677376,
"learning_rate": 1.4193264000618511e-06,
"loss": 0.1277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06448983401060104,
"step": 7670,
"valid_targets_mean": 1433.6,
"valid_targets_min": 697
},
{
"epoch": 6.245014245014245,
"grad_norm": 0.7165323289126707,
"learning_rate": 1.4043507809500923e-06,
"loss": 0.1268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06178100407123566,
"step": 7675,
"valid_targets_mean": 1578.9,
"valid_targets_min": 638
},
{
"epoch": 6.249084249084249,
"grad_norm": 0.7277559295792052,
"learning_rate": 1.3894517117363294e-06,
"loss": 0.1248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060996219515800476,
"step": 7680,
"valid_targets_mean": 1746.4,
"valid_targets_min": 727
},
{
"epoch": 6.253154253154253,
"grad_norm": 0.753037215595642,
"learning_rate": 1.3746292537533145e-06,
"loss": 0.1284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04994869977235794,
"step": 7685,
"valid_targets_mean": 1309.9,
"valid_targets_min": 761
},
{
"epoch": 6.257224257224257,
"grad_norm": 0.8053654916578108,
"learning_rate": 1.3598834680184124e-06,
"loss": 0.1134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06560010462999344,
"step": 7690,
"valid_targets_mean": 1368.6,
"valid_targets_min": 714
},
{
"epoch": 6.261294261294261,
"grad_norm": 0.795230502585329,
"learning_rate": 1.3452144152333734e-06,
"loss": 0.1333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06102893874049187,
"step": 7695,
"valid_targets_mean": 1491.8,
"valid_targets_min": 867
},
{
"epoch": 6.265364265364266,
"grad_norm": 0.7862793929838975,
"learning_rate": 1.330622155784067e-06,
"loss": 0.1255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07237902283668518,
"step": 7700,
"valid_targets_mean": 1994.0,
"valid_targets_min": 790
},
{
"epoch": 6.269434269434269,
"grad_norm": 0.8055709736092495,
"learning_rate": 1.316106749740249e-06,
"loss": 0.1178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05973295122385025,
"step": 7705,
"valid_targets_mean": 1523.4,
"valid_targets_min": 896
},
{
"epoch": 6.273504273504273,
"grad_norm": 1.1291501131017656,
"learning_rate": 1.3016682568552907e-06,
"loss": 0.1218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05998287722468376,
"step": 7710,
"valid_targets_mean": 1790.1,
"valid_targets_min": 1009
},
{
"epoch": 6.277574277574278,
"grad_norm": 0.7166308018469184,
"learning_rate": 1.2873067365659519e-06,
"loss": 0.1227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05086486041545868,
"step": 7715,
"valid_targets_mean": 1394.0,
"valid_targets_min": 717
},
{
"epoch": 6.281644281644281,
"grad_norm": 1.0582670753983305,
"learning_rate": 1.273022247992135e-06,
"loss": 0.1122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05162067711353302,
"step": 7720,
"valid_targets_mean": 1129.0,
"valid_targets_min": 659
},
{
"epoch": 6.285714285714286,
"grad_norm": 0.7611563612526064,
"learning_rate": 1.2588148499366405e-06,
"loss": 0.1091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.054125986993312836,
"step": 7725,
"valid_targets_mean": 1466.9,
"valid_targets_min": 642
},
{
"epoch": 6.28978428978429,
"grad_norm": 0.7818498664594019,
"learning_rate": 1.2446846008849046e-06,
"loss": 0.1154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04109550267457962,
"step": 7730,
"valid_targets_mean": 1129.4,
"valid_targets_min": 765
},
{
"epoch": 6.293854293854293,
"grad_norm": 0.8675512810239565,
"learning_rate": 1.2306315590047912e-06,
"loss": 0.1264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053088150918483734,
"step": 7735,
"valid_targets_mean": 1322.8,
"valid_targets_min": 631
},
{
"epoch": 6.297924297924298,
"grad_norm": 0.9623907919932141,
"learning_rate": 1.2166557821463387e-06,
"loss": 0.1265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0787411630153656,
"step": 7740,
"valid_targets_mean": 1612.0,
"valid_targets_min": 623
},
{
"epoch": 6.301994301994302,
"grad_norm": 0.7567121449013423,
"learning_rate": 1.2027573278415129e-06,
"loss": 0.1158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046164147555828094,
"step": 7745,
"valid_targets_mean": 1402.1,
"valid_targets_min": 940
},
{
"epoch": 6.3060643060643065,
"grad_norm": 0.7882207258869738,
"learning_rate": 1.188936253303976e-06,
"loss": 0.1216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051682114601135254,
"step": 7750,
"valid_targets_mean": 1337.8,
"valid_targets_min": 776
},
{
"epoch": 6.31013431013431,
"grad_norm": 0.8346483716380687,
"learning_rate": 1.1751926154288572e-06,
"loss": 0.1195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06084754317998886,
"step": 7755,
"valid_targets_mean": 1525.5,
"valid_targets_min": 623
},
{
"epoch": 6.314204314204314,
"grad_norm": 0.7952416348423385,
"learning_rate": 1.1615264707925178e-06,
"loss": 0.1177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.056195251643657684,
"step": 7760,
"valid_targets_mean": 1441.0,
"valid_targets_min": 693
},
{
"epoch": 6.318274318274319,
"grad_norm": 0.7893730311403948,
"learning_rate": 1.1479378756523008e-06,
"loss": 0.1132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03072535991668701,
"step": 7765,
"valid_targets_mean": 847.9,
"valid_targets_min": 611
},
{
"epoch": 6.322344322344322,
"grad_norm": 1.824214283992368,
"learning_rate": 1.1344268859463292e-06,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05747454613447189,
"step": 7770,
"valid_targets_mean": 1524.9,
"valid_targets_min": 793
},
{
"epoch": 6.326414326414326,
"grad_norm": 0.7591661900171986,
"learning_rate": 1.1209935572932485e-06,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060703910887241364,
"step": 7775,
"valid_targets_mean": 1779.4,
"valid_targets_min": 563
},
{
"epoch": 6.330484330484331,
"grad_norm": 0.7391670644699448,
"learning_rate": 1.1076379449920105e-06,
"loss": 0.1148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05903908237814903,
"step": 7780,
"valid_targets_mean": 1741.2,
"valid_targets_min": 1341
},
{
"epoch": 6.334554334554334,
"grad_norm": 0.8519469218904264,
"learning_rate": 1.0943601040216522e-06,
"loss": 0.117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0688420832157135,
"step": 7785,
"valid_targets_mean": 1875.6,
"valid_targets_min": 1107
},
{
"epoch": 6.338624338624339,
"grad_norm": 0.8426833803284528,
"learning_rate": 1.0811600890410467e-06,
"loss": 0.1213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05542324483394623,
"step": 7790,
"valid_targets_mean": 1419.5,
"valid_targets_min": 680
},
{
"epoch": 6.342694342694343,
"grad_norm": 0.7888806915864902,
"learning_rate": 1.0680379543887032e-06,
"loss": 0.1109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07356111705303192,
"step": 7795,
"valid_targets_mean": 1968.2,
"valid_targets_min": 981
},
{
"epoch": 6.346764346764346,
"grad_norm": 0.8256011446110055,
"learning_rate": 1.054993754082534e-06,
"loss": 0.1173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05775183066725731,
"step": 7800,
"valid_targets_mean": 1568.9,
"valid_targets_min": 937
},
{
"epoch": 6.350834350834351,
"grad_norm": 0.8120968604513121,
"learning_rate": 1.0420275418196168e-06,
"loss": 0.1121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06070208176970482,
"step": 7805,
"valid_targets_mean": 1645.2,
"valid_targets_min": 804
},
{
"epoch": 6.354904354904355,
"grad_norm": 0.8680173034124377,
"learning_rate": 1.0291393709760044e-06,
"loss": 0.116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057425472885370255,
"step": 7810,
"valid_targets_mean": 1574.9,
"valid_targets_min": 1019
},
{
"epoch": 6.358974358974359,
"grad_norm": 0.8493112270869786,
"learning_rate": 1.0163292946064774e-06,
"loss": 0.1114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048819221556186676,
"step": 7815,
"valid_targets_mean": 1121.6,
"valid_targets_min": 882
},
{
"epoch": 6.363044363044363,
"grad_norm": 0.7714277556830921,
"learning_rate": 1.0035973654443466e-06,
"loss": 0.1085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05912599712610245,
"step": 7820,
"valid_targets_mean": 1818.1,
"valid_targets_min": 1168
},
{
"epoch": 6.367114367114367,
"grad_norm": 0.8847457566201997,
"learning_rate": 9.909436359012182e-07,
"loss": 0.1039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05455390363931656,
"step": 7825,
"valid_targets_mean": 1417.8,
"valid_targets_min": 678
},
{
"epoch": 6.371184371184372,
"grad_norm": 0.8899939918613994,
"learning_rate": 9.783681580667825e-07,
"loss": 0.1126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04446838051080704,
"step": 7830,
"valid_targets_mean": 1051.0,
"valid_targets_min": 676
},
{
"epoch": 6.375254375254375,
"grad_norm": 0.7355334459190873,
"learning_rate": 9.658709837086144e-07,
"loss": 0.1108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05160418897867203,
"step": 7835,
"valid_targets_mean": 1431.1,
"valid_targets_min": 794
},
{
"epoch": 6.3793243793243795,
"grad_norm": 0.7838797957111434,
"learning_rate": 9.534521642719375e-07,
"loss": 0.1105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05564986169338226,
"step": 7840,
"valid_targets_mean": 1486.9,
"valid_targets_min": 742
},
{
"epoch": 6.383394383394384,
"grad_norm": 0.7965717627384523,
"learning_rate": 9.411117508794309e-07,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06882425397634506,
"step": 7845,
"valid_targets_mean": 1734.5,
"valid_targets_min": 741
},
{
"epoch": 6.387464387464387,
"grad_norm": 0.8893222531203173,
"learning_rate": 9.288497943310082e-07,
"loss": 0.1183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06830059736967087,
"step": 7850,
"valid_targets_mean": 1712.5,
"valid_targets_min": 1157
},
{
"epoch": 6.391534391534392,
"grad_norm": 0.8161513544565203,
"learning_rate": 9.166663451036118e-07,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06825710833072662,
"step": 7855,
"valid_targets_mean": 1723.8,
"valid_targets_min": 862
},
{
"epoch": 6.395604395604396,
"grad_norm": 0.8646112978766813,
"learning_rate": 9.045614533510072e-07,
"loss": 0.1186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06607664376497269,
"step": 7860,
"valid_targets_mean": 1633.1,
"valid_targets_min": 1019
},
{
"epoch": 6.399674399674399,
"grad_norm": 0.7626824305794315,
"learning_rate": 8.925351689035722e-07,
"loss": 0.1161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04722012206912041,
"step": 7865,
"valid_targets_mean": 1376.1,
"valid_targets_min": 1058
},
{
"epoch": 6.403744403744404,
"grad_norm": 0.840691332087647,
"learning_rate": 8.80587541268092e-07,
"loss": 0.1293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05784667283296585,
"step": 7870,
"valid_targets_mean": 1576.5,
"valid_targets_min": 618
},
{
"epoch": 6.407814407814408,
"grad_norm": 0.8207659704590586,
"learning_rate": 8.687186196275643e-07,
"loss": 0.1103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06569144874811172,
"step": 7875,
"valid_targets_mean": 1615.8,
"valid_targets_min": 629
},
{
"epoch": 6.411884411884412,
"grad_norm": 0.9326833663597143,
"learning_rate": 8.56928452840975e-07,
"loss": 0.1147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06420698761940002,
"step": 7880,
"valid_targets_mean": 1881.2,
"valid_targets_min": 1167
},
{
"epoch": 6.415954415954416,
"grad_norm": 0.8554904869093989,
"learning_rate": 8.452170894431267e-07,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05731596797704697,
"step": 7885,
"valid_targets_mean": 1367.2,
"valid_targets_min": 699
},
{
"epoch": 6.42002442002442,
"grad_norm": 0.8406972937569153,
"learning_rate": 8.335845776444218e-07,
"loss": 0.1033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04333464428782463,
"step": 7890,
"valid_targets_mean": 1174.9,
"valid_targets_min": 679
},
{
"epoch": 6.424094424094424,
"grad_norm": 0.8085860922583763,
"learning_rate": 8.22030965330658e-07,
"loss": 0.1085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.054415322840213776,
"step": 7895,
"valid_targets_mean": 1556.2,
"valid_targets_min": 504
},
{
"epoch": 6.428164428164428,
"grad_norm": 0.7792125188992498,
"learning_rate": 8.10556300062848e-07,
"loss": 0.1119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06440182030200958,
"step": 7900,
"valid_targets_mean": 1885.0,
"valid_targets_min": 1331
},
{
"epoch": 6.4322344322344325,
"grad_norm": 0.9287716280023119,
"learning_rate": 7.991606290770093e-07,
"loss": 0.1095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041307710111141205,
"step": 7905,
"valid_targets_mean": 1306.1,
"valid_targets_min": 661
},
{
"epoch": 6.436304436304436,
"grad_norm": 0.866709090318928,
"learning_rate": 7.878439992839815e-07,
"loss": 0.1149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0448264516890049,
"step": 7910,
"valid_targets_mean": 1330.1,
"valid_targets_min": 958
},
{
"epoch": 6.44037444037444,
"grad_norm": 0.7657298637604557,
"learning_rate": 7.766064572692178e-07,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04386502504348755,
"step": 7915,
"valid_targets_mean": 1465.0,
"valid_targets_min": 963
},
{
"epoch": 6.444444444444445,
"grad_norm": 0.8273726055440597,
"learning_rate": 7.65448049292612e-07,
"loss": 0.1128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05073707178235054,
"step": 7920,
"valid_targets_mean": 1428.0,
"valid_targets_min": 793
},
{
"epoch": 6.448514448514448,
"grad_norm": 0.8400987990779193,
"learning_rate": 7.54368821288296e-07,
"loss": 0.1093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06966409087181091,
"step": 7925,
"valid_targets_mean": 1633.1,
"valid_targets_min": 917
},
{
"epoch": 6.4525844525844525,
"grad_norm": 0.781744242763993,
"learning_rate": 7.433688188644517e-07,
"loss": 0.1127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04392581433057785,
"step": 7930,
"valid_targets_mean": 1246.5,
"valid_targets_min": 872
},
{
"epoch": 6.456654456654457,
"grad_norm": 0.8099440855665998,
"learning_rate": 7.324480873031281e-07,
"loss": 0.1119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05493423342704773,
"step": 7935,
"valid_targets_mean": 1903.6,
"valid_targets_min": 1220
},
{
"epoch": 6.46072446072446,
"grad_norm": 0.8303935015673607,
"learning_rate": 7.216066715600489e-07,
"loss": 0.1,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04634704440832138,
"step": 7940,
"valid_targets_mean": 1391.6,
"valid_targets_min": 712
},
{
"epoch": 6.464794464794465,
"grad_norm": 0.8580005093462261,
"learning_rate": 7.1084461626443e-07,
"loss": 0.106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053560368716716766,
"step": 7945,
"valid_targets_mean": 1295.0,
"valid_targets_min": 605
},
{
"epoch": 6.468864468864469,
"grad_norm": 0.7965111105826138,
"learning_rate": 7.001619657187996e-07,
"loss": 0.1173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04019693285226822,
"step": 7950,
"valid_targets_mean": 1414.8,
"valid_targets_min": 746
},
{
"epoch": 6.472934472934473,
"grad_norm": 0.8678383738827472,
"learning_rate": 6.895587638988077e-07,
"loss": 0.1022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044681429862976074,
"step": 7955,
"valid_targets_mean": 1059.4,
"valid_targets_min": 723
},
{
"epoch": 6.477004477004477,
"grad_norm": 0.8017716642473961,
"learning_rate": 6.790350544530522e-07,
"loss": 0.1093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06314340978860855,
"step": 7960,
"valid_targets_mean": 1634.2,
"valid_targets_min": 1327
},
{
"epoch": 6.481074481074481,
"grad_norm": 0.8064315437918422,
"learning_rate": 6.685908807028996e-07,
"loss": 0.1129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04939217120409012,
"step": 7965,
"valid_targets_mean": 1412.5,
"valid_targets_min": 902
},
{
"epoch": 6.4851444851444855,
"grad_norm": 0.8311002011404962,
"learning_rate": 6.582262856423005e-07,
"loss": 0.1101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05105116218328476,
"step": 7970,
"valid_targets_mean": 1558.8,
"valid_targets_min": 803
},
{
"epoch": 6.489214489214489,
"grad_norm": 0.8917053809677671,
"learning_rate": 6.479413119376143e-07,
"loss": 0.1131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05821871757507324,
"step": 7975,
"valid_targets_mean": 1441.2,
"valid_targets_min": 1079
},
{
"epoch": 6.493284493284493,
"grad_norm": 0.7886247369918117,
"learning_rate": 6.377360019274425e-07,
"loss": 0.1054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04788671433925629,
"step": 7980,
"valid_targets_mean": 1449.8,
"valid_targets_min": 1263
},
{
"epoch": 6.497354497354498,
"grad_norm": 0.8165623190693444,
"learning_rate": 6.276103976224401e-07,
"loss": 0.1116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05484423413872719,
"step": 7985,
"valid_targets_mean": 1487.4,
"valid_targets_min": 844
},
{
"epoch": 6.501424501424501,
"grad_norm": 0.9134655853507222,
"learning_rate": 6.175645407051467e-07,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05332685261964798,
"step": 7990,
"valid_targets_mean": 1421.4,
"valid_targets_min": 667
},
{
"epoch": 6.5054945054945055,
"grad_norm": 0.8551082037730058,
"learning_rate": 6.075984725298245e-07,
"loss": 0.1151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06440360844135284,
"step": 7995,
"valid_targets_mean": 1822.6,
"valid_targets_min": 1041
},
{
"epoch": 6.50956450956451,
"grad_norm": 0.8385108112647772,
"learning_rate": 5.977122341222852e-07,
"loss": 0.1129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046396177262067795,
"step": 8000,
"valid_targets_mean": 1327.4,
"valid_targets_min": 777
},
{
"epoch": 6.513634513634513,
"grad_norm": 0.8465014974527149,
"learning_rate": 5.879058661797055e-07,
"loss": 0.1111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05752868950366974,
"step": 8005,
"valid_targets_mean": 1823.8,
"valid_targets_min": 1283
},
{
"epoch": 6.517704517704518,
"grad_norm": 0.8181274172180951,
"learning_rate": 5.781794090704806e-07,
"loss": 0.1041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0392225906252861,
"step": 8010,
"valid_targets_mean": 924.0,
"valid_targets_min": 620
},
{
"epoch": 6.521774521774522,
"grad_norm": 0.8248876924646297,
"learning_rate": 5.685329028340492e-07,
"loss": 0.1049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045971810817718506,
"step": 8015,
"valid_targets_mean": 1480.2,
"valid_targets_min": 656
},
{
"epoch": 6.5258445258445255,
"grad_norm": 0.8286128442083801,
"learning_rate": 5.589663871807216e-07,
"loss": 0.1075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04419014975428581,
"step": 8020,
"valid_targets_mean": 1415.5,
"valid_targets_min": 697
},
{
"epoch": 6.52991452991453,
"grad_norm": 0.8155469269825053,
"learning_rate": 5.494799014915275e-07,
"loss": 0.1055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049654521048069,
"step": 8025,
"valid_targets_mean": 1655.8,
"valid_targets_min": 816
},
{
"epoch": 6.533984533984534,
"grad_norm": 0.8136069829867537,
"learning_rate": 5.400734848180467e-07,
"loss": 0.1001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04807547852396965,
"step": 8030,
"valid_targets_mean": 1553.0,
"valid_targets_min": 850
},
{
"epoch": 6.5380545380545385,
"grad_norm": 0.8744821289828539,
"learning_rate": 5.307471758822557e-07,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052176572382450104,
"step": 8035,
"valid_targets_mean": 1353.9,
"valid_targets_min": 747
},
{
"epoch": 6.542124542124542,
"grad_norm": 0.7918578875775583,
"learning_rate": 5.215010130763576e-07,
"loss": 0.113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04798971116542816,
"step": 8040,
"valid_targets_mean": 1420.9,
"valid_targets_min": 933
},
{
"epoch": 6.546194546194546,
"grad_norm": 0.8293804879113885,
"learning_rate": 5.123350344626343e-07,
"loss": 0.106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.053255513310432434,
"step": 8045,
"valid_targets_mean": 1394.9,
"valid_targets_min": 827
},
{
"epoch": 6.550264550264551,
"grad_norm": 0.7710088076942784,
"learning_rate": 5.032492777732856e-07,
"loss": 0.1042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04495897516608238,
"step": 8050,
"valid_targets_mean": 1383.2,
"valid_targets_min": 909
},
{
"epoch": 6.554334554334554,
"grad_norm": 0.7408488115343422,
"learning_rate": 4.942437804102729e-07,
"loss": 0.1065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05502689629793167,
"step": 8055,
"valid_targets_mean": 1682.4,
"valid_targets_min": 1094
},
{
"epoch": 6.5584045584045585,
"grad_norm": 0.8161047493613602,
"learning_rate": 4.853185794451643e-07,
"loss": 0.0979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04552149027585983,
"step": 8060,
"valid_targets_mean": 1118.4,
"valid_targets_min": 720
},
{
"epoch": 6.562474562474563,
"grad_norm": 0.810699986703739,
"learning_rate": 4.7647371161898547e-07,
"loss": 0.1075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04979178309440613,
"step": 8065,
"valid_targets_mean": 1538.2,
"valid_targets_min": 610
},
{
"epoch": 6.566544566544566,
"grad_norm": 0.7810924502619642,
"learning_rate": 4.677092133420647e-07,
"loss": 0.1015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05203615128993988,
"step": 8070,
"valid_targets_mean": 1570.1,
"valid_targets_min": 713
},
{
"epoch": 6.570614570614571,
"grad_norm": 0.8664468115638617,
"learning_rate": 4.5902512069389006e-07,
"loss": 0.1088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.050125155597925186,
"step": 8075,
"valid_targets_mean": 1537.8,
"valid_targets_min": 874
},
{
"epoch": 6.574684574684575,
"grad_norm": 0.784693140282473,
"learning_rate": 4.504214694229525e-07,
"loss": 0.1066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051420196890830994,
"step": 8080,
"valid_targets_mean": 1471.2,
"valid_targets_min": 765
},
{
"epoch": 6.5787545787545785,
"grad_norm": 0.8589862191743883,
"learning_rate": 4.418982949466011e-07,
"loss": 0.1028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04462102800607681,
"step": 8085,
"valid_targets_mean": 1254.4,
"valid_targets_min": 816
},
{
"epoch": 6.582824582824583,
"grad_norm": 0.8700836145069042,
"learning_rate": 4.334556323509009e-07,
"loss": 0.1058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04805884137749672,
"step": 8090,
"valid_targets_mean": 1482.9,
"valid_targets_min": 1182
},
{
"epoch": 6.586894586894587,
"grad_norm": 0.6773547787375108,
"learning_rate": 4.25093516390489e-07,
"loss": 0.1102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0742184966802597,
"step": 8095,
"valid_targets_mean": 1583.2,
"valid_targets_min": 363
},
{
"epoch": 6.590964590964591,
"grad_norm": 0.49684846547746847,
"learning_rate": 4.1681198148841415e-07,
"loss": 0.0797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04401320964097977,
"step": 8100,
"valid_targets_mean": 3710.1,
"valid_targets_min": 3074
},
{
"epoch": 6.595034595034595,
"grad_norm": 0.5269822498666787,
"learning_rate": 4.0861106173602837e-07,
"loss": 0.0753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04181273281574249,
"step": 8105,
"valid_targets_mean": 2577.6,
"valid_targets_min": 700
},
{
"epoch": 6.599104599104599,
"grad_norm": 0.5319878660224543,
"learning_rate": 4.004907908928135e-07,
"loss": 0.0794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03852052986621857,
"step": 8110,
"valid_targets_mean": 3309.8,
"valid_targets_min": 803
},
{
"epoch": 6.603174603174603,
"grad_norm": 0.4436363617952094,
"learning_rate": 3.9245120238626144e-07,
"loss": 0.0727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03728438913822174,
"step": 8115,
"valid_targets_mean": 2484.8,
"valid_targets_min": 920
},
{
"epoch": 6.607244607244607,
"grad_norm": 0.4833719991023813,
"learning_rate": 3.8449232931173195e-07,
"loss": 0.0759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039660267531871796,
"step": 8120,
"valid_targets_mean": 3095.1,
"valid_targets_min": 806
},
{
"epoch": 6.6113146113146115,
"grad_norm": 0.7829899471206379,
"learning_rate": 3.766142044323129e-07,
"loss": 0.1153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06311972439289093,
"step": 8125,
"valid_targets_mean": 1663.1,
"valid_targets_min": 718
},
{
"epoch": 6.615384615384615,
"grad_norm": 0.4509111643360801,
"learning_rate": 3.688168601786912e-07,
"loss": 0.0836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0408773347735405,
"step": 8130,
"valid_targets_mean": 3443.2,
"valid_targets_min": 1133
},
{
"epoch": 6.619454619454619,
"grad_norm": 0.5161079431546142,
"learning_rate": 3.6110032864901776e-07,
"loss": 0.0832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03457147255539894,
"step": 8135,
"valid_targets_mean": 1609.9,
"valid_targets_min": 859
},
{
"epoch": 6.623524623524624,
"grad_norm": 0.3376406967796116,
"learning_rate": 3.5346464160876945e-07,
"loss": 0.1058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02600034326314926,
"step": 8140,
"valid_targets_mean": 5572.1,
"valid_targets_min": 5150
},
{
"epoch": 6.627594627594627,
"grad_norm": 0.4907063131191801,
"learning_rate": 3.459098304906228e-07,
"loss": 0.0679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04523205757141113,
"step": 8145,
"valid_targets_mean": 3950.0,
"valid_targets_min": 502
},
{
"epoch": 6.6316646316646315,
"grad_norm": 0.4380405824798826,
"learning_rate": 3.384359263943271e-07,
"loss": 0.0722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04171394184231758,
"step": 8150,
"valid_targets_mean": 3669.2,
"valid_targets_min": 600
},
{
"epoch": 6.635734635734636,
"grad_norm": 0.41061389847454,
"learning_rate": 3.310429600865739e-07,
"loss": 0.0688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030914265662431717,
"step": 8155,
"valid_targets_mean": 2980.4,
"valid_targets_min": 518
},
{
"epoch": 6.639804639804639,
"grad_norm": 0.43198145452754944,
"learning_rate": 3.237309620008722e-07,
"loss": 0.1178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0387565903365612,
"step": 8160,
"valid_targets_mean": 3675.4,
"valid_targets_min": 549
},
{
"epoch": 6.643874643874644,
"grad_norm": 0.35792992132158885,
"learning_rate": 3.1649996223741765e-07,
"loss": 0.0646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027515945956110954,
"step": 8165,
"valid_targets_mean": 4013.2,
"valid_targets_min": 3548
},
{
"epoch": 6.647944647944648,
"grad_norm": 0.47471099164218855,
"learning_rate": 3.093499905629727e-07,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038465503603219986,
"step": 8170,
"valid_targets_mean": 2000.5,
"valid_targets_min": 644
},
{
"epoch": 6.652014652014652,
"grad_norm": 0.32225997700337605,
"learning_rate": 3.022810764107487e-07,
"loss": 0.0596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02280164137482643,
"step": 8175,
"valid_targets_mean": 2904.4,
"valid_targets_min": 720
},
{
"epoch": 6.656084656084656,
"grad_norm": 0.5895755914253757,
"learning_rate": 2.9529324888027287e-07,
"loss": 0.0797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.028042782098054886,
"step": 8180,
"valid_targets_mean": 1487.6,
"valid_targets_min": 516
},
{
"epoch": 6.66015466015466,
"grad_norm": 0.5222751795102811,
"learning_rate": 2.8838653673727514e-07,
"loss": 0.0781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048454202711582184,
"step": 8185,
"valid_targets_mean": 2006.0,
"valid_targets_min": 557
},
{
"epoch": 6.6642246642246645,
"grad_norm": 0.5326599642169098,
"learning_rate": 2.8156096841357893e-07,
"loss": 0.0833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04685577005147934,
"step": 8190,
"valid_targets_mean": 3359.2,
"valid_targets_min": 1086
},
{
"epoch": 6.668294668294668,
"grad_norm": 0.48322360350526905,
"learning_rate": 2.748165720069684e-07,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05052535608410835,
"step": 8195,
"valid_targets_mean": 2866.8,
"valid_targets_min": 1008
},
{
"epoch": 6.672364672364672,
"grad_norm": 0.5129442984365581,
"learning_rate": 2.6815337528107723e-07,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03285352140665054,
"step": 8200,
"valid_targets_mean": 3259.9,
"valid_targets_min": 2702
},
{
"epoch": 6.676434676434677,
"grad_norm": 0.3692290656961646,
"learning_rate": 2.615714056652841e-07,
"loss": 0.0686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030034877359867096,
"step": 8205,
"valid_targets_mean": 4086.4,
"valid_targets_min": 3798
},
{
"epoch": 6.68050468050468,
"grad_norm": 0.8498455958044546,
"learning_rate": 2.5507069025458855e-07,
"loss": 0.0841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06665704399347305,
"step": 8210,
"valid_targets_mean": 1020.8,
"valid_targets_min": 598
},
{
"epoch": 6.6845746845746845,
"grad_norm": 0.4283220379269479,
"learning_rate": 2.486512558095e-07,
"loss": 0.0925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02849685214459896,
"step": 8215,
"valid_targets_mean": 2028.4,
"valid_targets_min": 590
},
{
"epoch": 6.688644688644689,
"grad_norm": 0.4312912789027484,
"learning_rate": 2.423131287559355e-07,
"loss": 0.0879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0402199849486351,
"step": 8220,
"valid_targets_mean": 4046.9,
"valid_targets_min": 3390
},
{
"epoch": 6.692714692714693,
"grad_norm": 0.6525867542972212,
"learning_rate": 2.3605633518510195e-07,
"loss": 0.1139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12717895209789276,
"step": 8225,
"valid_targets_mean": 2247.4,
"valid_targets_min": 984
},
{
"epoch": 6.696784696784697,
"grad_norm": 0.48625518043675997,
"learning_rate": 2.2988090085339864e-07,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04617800936102867,
"step": 8230,
"valid_targets_mean": 3348.9,
"valid_targets_min": 2176
},
{
"epoch": 6.700854700854701,
"grad_norm": 0.5666484347927709,
"learning_rate": 2.237868511823016e-07,
"loss": 0.0802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038623686879873276,
"step": 8235,
"valid_targets_mean": 2385.1,
"valid_targets_min": 1074
},
{
"epoch": 6.704924704924705,
"grad_norm": 0.4480717010310978,
"learning_rate": 2.1777421125826593e-07,
"loss": 0.0848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03942921385169029,
"step": 8240,
"valid_targets_mean": 3126.2,
"valid_targets_min": 1212
},
{
"epoch": 6.708994708994709,
"grad_norm": 0.447193589815513,
"learning_rate": 2.1184300583261263e-07,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04053179919719696,
"step": 8245,
"valid_targets_mean": 4386.0,
"valid_targets_min": 2258
},
{
"epoch": 6.713064713064713,
"grad_norm": 0.37115709592990564,
"learning_rate": 2.059932593214442e-07,
"loss": 0.066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05170625448226929,
"step": 8250,
"valid_targets_mean": 3738.9,
"valid_targets_min": 1466
},
{
"epoch": 6.7171347171347175,
"grad_norm": 0.3666621308583359,
"learning_rate": 2.0022499580552247e-07,
"loss": 0.08,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033547915518283844,
"step": 8255,
"valid_targets_mean": 3522.6,
"valid_targets_min": 560
},
{
"epoch": 6.721204721204721,
"grad_norm": 0.41360520779368637,
"learning_rate": 1.9453823903019086e-07,
"loss": 0.0817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04005451872944832,
"step": 8260,
"valid_targets_mean": 3383.1,
"valid_targets_min": 1189
},
{
"epoch": 6.725274725274725,
"grad_norm": 0.39520542502071915,
"learning_rate": 1.8893301240525463e-07,
"loss": 0.0672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03196336701512337,
"step": 8265,
"valid_targets_mean": 3610.1,
"valid_targets_min": 2257
},
{
"epoch": 6.72934472934473,
"grad_norm": 0.37918993485934277,
"learning_rate": 1.8340933900490965e-07,
"loss": 0.0652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026241963729262352,
"step": 8270,
"valid_targets_mean": 3479.8,
"valid_targets_min": 886
},
{
"epoch": 6.733414733414733,
"grad_norm": 0.4561669870328987,
"learning_rate": 1.7796724156762258e-07,
"loss": 0.0729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03602328151464462,
"step": 8275,
"valid_targets_mean": 3346.6,
"valid_targets_min": 2409
},
{
"epoch": 6.7374847374847375,
"grad_norm": 0.4635371928947697,
"learning_rate": 1.726067424960576e-07,
"loss": 0.0654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031619295477867126,
"step": 8280,
"valid_targets_mean": 3552.0,
"valid_targets_min": 2309
},
{
"epoch": 6.741554741554742,
"grad_norm": 0.7003118747711201,
"learning_rate": 1.6732786385696754e-07,
"loss": 0.1105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0696185976266861,
"step": 8285,
"valid_targets_mean": 2149.8,
"valid_targets_min": 645
},
{
"epoch": 6.745624745624745,
"grad_norm": 0.3594856692476842,
"learning_rate": 1.6213062738111407e-07,
"loss": 0.06,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02745797298848629,
"step": 8290,
"valid_targets_mean": 3310.2,
"valid_targets_min": 545
},
{
"epoch": 6.74969474969475,
"grad_norm": 0.474912995800518,
"learning_rate": 1.5701505446317656e-07,
"loss": 0.0601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03320920467376709,
"step": 8295,
"valid_targets_mean": 2458.4,
"valid_targets_min": 667
},
{
"epoch": 6.753764753764754,
"grad_norm": 0.3593430573149411,
"learning_rate": 1.5198116616165881e-07,
"loss": 0.0608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02956734225153923,
"step": 8300,
"valid_targets_mean": 3501.5,
"valid_targets_min": 2353
},
{
"epoch": 6.7578347578347575,
"grad_norm": 0.4694070743198895,
"learning_rate": 1.4702898319881142e-07,
"loss": 0.0628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04120086506009102,
"step": 8305,
"valid_targets_mean": 3220.2,
"valid_targets_min": 792
},
{
"epoch": 6.761904761904762,
"grad_norm": 0.39254754104169143,
"learning_rate": 1.421585259605318e-07,
"loss": 0.1059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027905117720365524,
"step": 8310,
"valid_targets_mean": 3818.5,
"valid_targets_min": 3276
},
{
"epoch": 6.765974765974766,
"grad_norm": 0.4934206140709475,
"learning_rate": 1.3736981449629982e-07,
"loss": 0.0929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048690035939216614,
"step": 8315,
"valid_targets_mean": 2390.9,
"valid_targets_min": 647
},
{
"epoch": 6.77004477004477,
"grad_norm": 0.5152362898858448,
"learning_rate": 1.3266286851907783e-07,
"loss": 0.0741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041787609457969666,
"step": 8320,
"valid_targets_mean": 1500.6,
"valid_targets_min": 673
},
{
"epoch": 6.774114774114774,
"grad_norm": 0.7351478599697331,
"learning_rate": 1.280377074052397e-07,
"loss": 0.0919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08116742968559265,
"step": 8325,
"valid_targets_mean": 1711.2,
"valid_targets_min": 702
},
{
"epoch": 6.778184778184778,
"grad_norm": 0.47783788496330504,
"learning_rate": 1.234943501944863e-07,
"loss": 0.1044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04755005985498428,
"step": 8330,
"valid_targets_mean": 3036.1,
"valid_targets_min": 945
},
{
"epoch": 6.782254782254782,
"grad_norm": 0.5018792752451303,
"learning_rate": 1.1903281558976798e-07,
"loss": 0.0772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.051417913287878036,
"step": 8335,
"valid_targets_mean": 3317.2,
"valid_targets_min": 2265
},
{
"epoch": 6.786324786324786,
"grad_norm": 0.3439978747787152,
"learning_rate": 1.1465312195721334e-07,
"loss": 0.0935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03338252753019333,
"step": 8340,
"valid_targets_mean": 3875.2,
"valid_targets_min": 3051
},
{
"epoch": 6.7903947903947905,
"grad_norm": 0.4903813555602027,
"learning_rate": 1.1035528732604272e-07,
"loss": 0.0747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05204244330525398,
"step": 8345,
"valid_targets_mean": 2069.8,
"valid_targets_min": 523
},
{
"epoch": 6.794464794464794,
"grad_norm": 0.3832807020853381,
"learning_rate": 1.0613932938850157e-07,
"loss": 0.0698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03278394788503647,
"step": 8350,
"valid_targets_mean": 1640.8,
"valid_targets_min": 468
},
{
"epoch": 6.798534798534798,
"grad_norm": 0.3608814015492147,
"learning_rate": 1.020052654997894e-07,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022406112402677536,
"step": 8355,
"valid_targets_mean": 4435.1,
"valid_targets_min": 885
},
{
"epoch": 6.802604802604803,
"grad_norm": 0.3861502768165619,
"learning_rate": 9.79531126779798e-08,
"loss": 0.0654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025468919426202774,
"step": 8360,
"valid_targets_mean": 1889.2,
"valid_targets_min": 546
},
{
"epoch": 6.806674806674806,
"grad_norm": 0.38892792716177965,
"learning_rate": 9.398288760395836e-08,
"loss": 0.0662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03875254467129707,
"step": 8365,
"valid_targets_mean": 4257.1,
"valid_targets_min": 2414
},
{
"epoch": 6.8107448107448105,
"grad_norm": 0.5353675959388392,
"learning_rate": 9.009460662134928e-08,
"loss": 0.079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043166883289813995,
"step": 8370,
"valid_targets_mean": 1502.4,
"valid_targets_min": 697
},
{
"epoch": 6.814814814814815,
"grad_norm": 0.4502618811767403,
"learning_rate": 8.628828573645554e-08,
"loss": 0.0813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039157938212156296,
"step": 8375,
"valid_targets_mean": 3466.0,
"valid_targets_min": 2777
},
{
"epoch": 6.818884818884819,
"grad_norm": 0.44084545531435015,
"learning_rate": 8.256394061817663e-08,
"loss": 0.0841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043219827115535736,
"step": 8380,
"valid_targets_mean": 3982.1,
"valid_targets_min": 3061
},
{
"epoch": 6.822954822954823,
"grad_norm": 0.37363497568335224,
"learning_rate": 7.892158659796422e-08,
"loss": 0.0682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034288160502910614,
"step": 8385,
"valid_targets_mean": 2788.0,
"valid_targets_min": 868
},
{
"epoch": 6.827024827024827,
"grad_norm": 0.3799289990411093,
"learning_rate": 7.536123866974665e-08,
"loss": 0.0738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02917984500527382,
"step": 8390,
"valid_targets_mean": 2120.6,
"valid_targets_min": 752
},
{
"epoch": 6.831094831094831,
"grad_norm": 0.3835533743706495,
"learning_rate": 7.188291148986892e-08,
"loss": 0.077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03172875568270683,
"step": 8395,
"valid_targets_mean": 3477.1,
"valid_targets_min": 1141
},
{
"epoch": 6.835164835164835,
"grad_norm": 0.34008156095211195,
"learning_rate": 6.848661937703727e-08,
"loss": 0.0577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03241172060370445,
"step": 8400,
"valid_targets_mean": 3888.4,
"valid_targets_min": 3540
},
{
"epoch": 6.839234839234839,
"grad_norm": 0.4090753301091059,
"learning_rate": 6.517237631225026e-08,
"loss": 0.0768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027315791696310043,
"step": 8405,
"valid_targets_mean": 3086.8,
"valid_targets_min": 773
},
{
"epoch": 6.843304843304844,
"grad_norm": 0.39701062406863746,
"learning_rate": 6.194019593875444e-08,
"loss": 0.0726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025227008387446404,
"step": 8410,
"valid_targets_mean": 3558.6,
"valid_targets_min": 2587
},
{
"epoch": 6.847374847374847,
"grad_norm": 0.4392394924145199,
"learning_rate": 5.879009156197768e-08,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03493019938468933,
"step": 8415,
"valid_targets_mean": 2688.9,
"valid_targets_min": 773
},
{
"epoch": 6.851444851444851,
"grad_norm": 0.5083647411957302,
"learning_rate": 5.572207614947589e-08,
"loss": 0.0732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03646247088909149,
"step": 8420,
"valid_targets_mean": 3734.4,
"valid_targets_min": 3068
},
{
"epoch": 6.855514855514856,
"grad_norm": 0.628171717161323,
"learning_rate": 5.273616233088641e-08,
"loss": 0.0805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04628308117389679,
"step": 8425,
"valid_targets_mean": 1816.1,
"valid_targets_min": 893
},
{
"epoch": 6.85958485958486,
"grad_norm": 0.6087268426251439,
"learning_rate": 4.983236239787026e-08,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04026108980178833,
"step": 8430,
"valid_targets_mean": 1444.4,
"valid_targets_min": 708
},
{
"epoch": 6.8636548636548635,
"grad_norm": 0.4335028192076854,
"learning_rate": 4.701068830405886e-08,
"loss": 0.0804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029476728290319443,
"step": 8435,
"valid_targets_mean": 1768.8,
"valid_targets_min": 617
},
{
"epoch": 6.867724867724868,
"grad_norm": 0.45556499572135306,
"learning_rate": 4.4271151665014055e-08,
"loss": 0.0718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03315385431051254,
"step": 8440,
"valid_targets_mean": 2634.9,
"valid_targets_min": 720
},
{
"epoch": 6.871794871794872,
"grad_norm": 0.5629937228346741,
"learning_rate": 4.161376375817039e-08,
"loss": 0.0661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04290713742375374,
"step": 8445,
"valid_targets_mean": 1836.2,
"valid_targets_min": 785
},
{
"epoch": 6.875864875864876,
"grad_norm": 0.5669698114208702,
"learning_rate": 3.903853552279513e-08,
"loss": 0.0872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06467582285404205,
"step": 8450,
"valid_targets_mean": 2148.2,
"valid_targets_min": 765
},
{
"epoch": 6.87993487993488,
"grad_norm": 0.30486345935213593,
"learning_rate": 3.654547755994164e-08,
"loss": 0.0651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019002530723810196,
"step": 8455,
"valid_targets_mean": 3639.2,
"valid_targets_min": 2863
},
{
"epoch": 6.884004884004884,
"grad_norm": 0.38454514502865644,
"learning_rate": 3.413460013240499e-08,
"loss": 0.0655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026053160429000854,
"step": 8460,
"valid_targets_mean": 3033.4,
"valid_targets_min": 555
},
{
"epoch": 6.888074888074888,
"grad_norm": 0.4941087528400253,
"learning_rate": 3.180591316467974e-08,
"loss": 0.0745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04288317263126373,
"step": 8465,
"valid_targets_mean": 2346.6,
"valid_targets_min": 721
},
{
"epoch": 6.892144892144892,
"grad_norm": 0.3509155023887329,
"learning_rate": 2.9559426242919964e-08,
"loss": 0.0606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03283192217350006,
"step": 8470,
"valid_targets_mean": 4902.1,
"valid_targets_min": 3640
},
{
"epoch": 6.896214896214897,
"grad_norm": 0.4037435152095895,
"learning_rate": 2.7395148614897115e-08,
"loss": 0.0617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03601628914475441,
"step": 8475,
"valid_targets_mean": 4536.6,
"valid_targets_min": 2020
},
{
"epoch": 6.9002849002849,
"grad_norm": 0.34603119742925265,
"learning_rate": 2.5313089189966665e-08,
"loss": 0.0775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025459568947553635,
"step": 8480,
"valid_targets_mean": 3218.6,
"valid_targets_min": 739
},
{
"epoch": 6.904354904354904,
"grad_norm": 0.4268602714698763,
"learning_rate": 2.331325653902816e-08,
"loss": 0.0945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03908785805106163,
"step": 8485,
"valid_targets_mean": 3774.6,
"valid_targets_min": 2945
},
{
"epoch": 6.908424908424909,
"grad_norm": 0.4557025570243415,
"learning_rate": 2.139565889448969e-08,
"loss": 0.07,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04192078113555908,
"step": 8490,
"valid_targets_mean": 3045.4,
"valid_targets_min": 704
},
{
"epoch": 6.912494912494912,
"grad_norm": 0.4093961592946955,
"learning_rate": 1.9560304150234576e-08,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030827539041638374,
"step": 8495,
"valid_targets_mean": 2492.8,
"valid_targets_min": 774
},
{
"epoch": 6.916564916564917,
"grad_norm": 0.4284938895525246,
"learning_rate": 1.7807199861594736e-08,
"loss": 0.0906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02964516170322895,
"step": 8500,
"valid_targets_mean": 2564.6,
"valid_targets_min": 485
},
{
"epoch": 6.920634920634921,
"grad_norm": 0.43820381846708467,
"learning_rate": 1.613635324530405e-08,
"loss": 0.0682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03012934699654579,
"step": 8505,
"valid_targets_mean": 3002.5,
"valid_targets_min": 1048
},
{
"epoch": 6.924704924704924,
"grad_norm": 0.4182221488232721,
"learning_rate": 1.4547771179487246e-08,
"loss": 0.0721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.032236211001873016,
"step": 8510,
"valid_targets_mean": 2588.5,
"valid_targets_min": 722
},
{
"epoch": 6.928774928774929,
"grad_norm": 0.5356394748249438,
"learning_rate": 1.304146020361996e-08,
"loss": 0.0757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04836539924144745,
"step": 8515,
"valid_targets_mean": 1443.8,
"valid_targets_min": 865
},
{
"epoch": 6.932844932844933,
"grad_norm": 0.4971988244053681,
"learning_rate": 1.1617426518504283e-08,
"loss": 0.1033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03724466264247894,
"step": 8520,
"valid_targets_mean": 2283.1,
"valid_targets_min": 675
},
{
"epoch": 6.9369149369149365,
"grad_norm": 0.41438516750308313,
"learning_rate": 1.0275675986242128e-08,
"loss": 0.0913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03457161411643028,
"step": 8525,
"valid_targets_mean": 3202.0,
"valid_targets_min": 782
},
{
"epoch": 6.940984940984941,
"grad_norm": 0.4720882472008192,
"learning_rate": 9.016214130219692e-09,
"loss": 0.0686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03335484117269516,
"step": 8530,
"valid_targets_mean": 2586.9,
"valid_targets_min": 795
},
{
"epoch": 6.945054945054945,
"grad_norm": 0.4477158642708563,
"learning_rate": 7.839046135069695e-09,
"loss": 0.069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.033690642565488815,
"step": 8535,
"valid_targets_mean": 3345.4,
"valid_targets_min": 2017
},
{
"epoch": 6.949124949124949,
"grad_norm": 0.4310573655106279,
"learning_rate": 6.744176846664729e-09,
"loss": 0.0679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029223371297121048,
"step": 8540,
"valid_targets_mean": 1937.5,
"valid_targets_min": 798
},
{
"epoch": 6.953194953194953,
"grad_norm": 0.37061900269005643,
"learning_rate": 5.731610772083951e-09,
"loss": 0.0597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029739029705524445,
"step": 8545,
"valid_targets_mean": 3302.2,
"valid_targets_min": 860
},
{
"epoch": 6.957264957264957,
"grad_norm": 0.39293408289174847,
"learning_rate": 4.801352079606414e-09,
"loss": 0.0844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03068091720342636,
"step": 8550,
"valid_targets_mean": 3287.2,
"valid_targets_min": 878
},
{
"epoch": 6.961334961334961,
"grad_norm": 0.36550971062080234,
"learning_rate": 3.9534045986888706e-09,
"loss": 0.0616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.026515811681747437,
"step": 8555,
"valid_targets_mean": 3800.8,
"valid_targets_min": 2602
},
{
"epoch": 6.965404965404965,
"grad_norm": 0.5094035280811099,
"learning_rate": 3.1877718199480045e-09,
"loss": 0.0705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04128776118159294,
"step": 8560,
"valid_targets_mean": 2853.9,
"valid_targets_min": 945
},
{
"epoch": 6.96947496947497,
"grad_norm": 0.43630707115728157,
"learning_rate": 2.5044568951471114e-09,
"loss": 0.0678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042031463235616684,
"step": 8565,
"valid_targets_mean": 3633.9,
"valid_targets_min": 2059
},
{
"epoch": 6.973544973544973,
"grad_norm": 0.4179577364933974,
"learning_rate": 1.9034626371872147e-09,
"loss": 0.0713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03878530487418175,
"step": 8570,
"valid_targets_mean": 4244.8,
"valid_targets_min": 2529
},
{
"epoch": 6.977614977614977,
"grad_norm": 0.3982770165173577,
"learning_rate": 1.3847915200893015e-09,
"loss": 0.0615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04271527752280235,
"step": 8575,
"valid_targets_mean": 4650.8,
"valid_targets_min": 892
},
{
"epoch": 6.981684981684982,
"grad_norm": 0.28047291358880216,
"learning_rate": 9.484456789876639e-10,
"loss": 0.065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02087704837322235,
"step": 8580,
"valid_targets_mean": 4432.1,
"valid_targets_min": 1657
},
{
"epoch": 6.985754985754986,
"grad_norm": 0.6547087358433034,
"learning_rate": 5.944269101232358e-10,
"loss": 0.1178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09982357919216156,
"step": 8585,
"valid_targets_mean": 2023.0,
"valid_targets_min": 709
},
{
"epoch": 6.98982498982499,
"grad_norm": 0.3577008023192031,
"learning_rate": 3.2273667083027036e-10,
"loss": 0.1045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027526959776878357,
"step": 8590,
"valid_targets_mean": 3241.9,
"valid_targets_min": 527
},
{
"epoch": 6.993894993894994,
"grad_norm": 0.4179136407746658,
"learning_rate": 1.3337607953634034e-10,
"loss": 0.0743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04843872785568237,
"step": 8595,
"valid_targets_mean": 3313.4,
"valid_targets_min": 2308
},
{
"epoch": 6.997964997964998,
"grad_norm": 0.3512093714041848,
"learning_rate": 2.6345915753456243e-11,
"loss": 0.0599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0316237136721611,
"step": 8600,
"valid_targets_mean": 3463.5,
"valid_targets_min": 2883
},
{
"epoch": 6.999592999592999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04449460655450821,
"step": 8602,
"total_flos": 2.7561038524606054e+18,
"train_loss": 0.015238219677667456,
"train_runtime": 26280.0507,
"train_samples_per_second": 5.235,
"train_steps_per_second": 0.327,
"valid_targets_mean": 4028.4,
"valid_targets_min": 1273
}
],
"logging_steps": 5,
"max_steps": 8603,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 2.7561038524606054e+18,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}