Files
Qwen3-8B_exp_tas_tmux_large…/trainer_state.json
ModelHub XC 6c0ef39b44 初始化项目,由ModelHub XC社区提供模型
Model: laion/Qwen3-8B_exp_tas_tmux_large_traces_save-strategy_steps
Source: Original Platform
2026-06-03 04:24:20 +08:00

5625 lines
156 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 8.0,
"eval_steps": 500,
"global_step": 2536,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.015772870662460567,
"grad_norm": 2.169656955227513,
"learning_rate": 3.0769230769230774e-05,
"loss": 0.9249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.817986011505127,
"step": 5,
"valid_targets_mean": 3434.8,
"valid_targets_min": 744
},
{
"epoch": 0.031545741324921134,
"grad_norm": 0.8559043399532138,
"learning_rate": 6.923076923076924e-05,
"loss": 0.7835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7119892835617065,
"step": 10,
"valid_targets_mean": 3699.3,
"valid_targets_min": 1231
},
{
"epoch": 0.0473186119873817,
"grad_norm": 0.6757245841747609,
"learning_rate": 9.99999612380875e-05,
"loss": 0.6389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6657205820083618,
"step": 15,
"valid_targets_mean": 3761.8,
"valid_targets_min": 751
},
{
"epoch": 0.06309148264984227,
"grad_norm": 0.5457612768667142,
"learning_rate": 9.999860457746025e-05,
"loss": 0.6338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6094217300415039,
"step": 20,
"valid_targets_mean": 3539.5,
"valid_targets_min": 981
},
{
"epoch": 0.07886435331230283,
"grad_norm": 0.5562908717471081,
"learning_rate": 9.999530988130677e-05,
"loss": 0.6127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6498370170593262,
"step": 25,
"valid_targets_mean": 3522.9,
"valid_targets_min": 1087
},
{
"epoch": 0.0946372239747634,
"grad_norm": 0.5548782107356937,
"learning_rate": 9.999007727733537e-05,
"loss": 0.6193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.594431459903717,
"step": 30,
"valid_targets_mean": 2975.7,
"valid_targets_min": 1141
},
{
"epoch": 0.11041009463722397,
"grad_norm": 0.4872105480697271,
"learning_rate": 9.998290696837115e-05,
"loss": 0.5795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5703617334365845,
"step": 35,
"valid_targets_mean": 3581.2,
"valid_targets_min": 628
},
{
"epoch": 0.12618296529968454,
"grad_norm": 0.4858873354273939,
"learning_rate": 9.997379923234816e-05,
"loss": 0.5804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5455387830734253,
"step": 40,
"valid_targets_mean": 3317.4,
"valid_targets_min": 700
},
{
"epoch": 0.14195583596214512,
"grad_norm": 0.5108147907048001,
"learning_rate": 9.996275442229857e-05,
"loss": 0.5701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5683155655860901,
"step": 45,
"valid_targets_mean": 3741.8,
"valid_targets_min": 682
},
{
"epoch": 0.15772870662460567,
"grad_norm": 0.5274941244563711,
"learning_rate": 9.994977296633902e-05,
"loss": 0.5859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6010461449623108,
"step": 50,
"valid_targets_mean": 3634.8,
"valid_targets_min": 1082
},
{
"epoch": 0.17350157728706625,
"grad_norm": 0.5937423674749936,
"learning_rate": 9.993485536765398e-05,
"loss": 0.5602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5546848773956299,
"step": 55,
"valid_targets_mean": 4297.9,
"valid_targets_min": 650
},
{
"epoch": 0.1892744479495268,
"grad_norm": 0.4747000855685691,
"learning_rate": 9.991800220447634e-05,
"loss": 0.5922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5315375328063965,
"step": 60,
"valid_targets_mean": 3689.7,
"valid_targets_min": 961
},
{
"epoch": 0.20504731861198738,
"grad_norm": 0.5010503817387185,
"learning_rate": 9.989921413006489e-05,
"loss": 0.5805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6408827304840088,
"step": 65,
"valid_targets_mean": 3859.3,
"valid_targets_min": 1319
},
{
"epoch": 0.22082018927444794,
"grad_norm": 0.468284305556988,
"learning_rate": 9.987849187267908e-05,
"loss": 0.5505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5802025198936462,
"step": 70,
"valid_targets_mean": 3437.2,
"valid_targets_min": 658
},
{
"epoch": 0.23659305993690852,
"grad_norm": 0.4456626356470159,
"learning_rate": 9.985583623555076e-05,
"loss": 0.5571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5259662866592407,
"step": 75,
"valid_targets_mean": 3729.0,
"valid_targets_min": 821
},
{
"epoch": 0.25236593059936907,
"grad_norm": 0.5189246417709207,
"learning_rate": 9.9831248096853e-05,
"loss": 0.5465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5496809482574463,
"step": 80,
"valid_targets_mean": 3154.8,
"valid_targets_min": 844
},
{
"epoch": 0.26813880126182965,
"grad_norm": 0.4242414929398914,
"learning_rate": 9.980472840966614e-05,
"loss": 0.558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5265679955482483,
"step": 85,
"valid_targets_mean": 4139.5,
"valid_targets_min": 869
},
{
"epoch": 0.28391167192429023,
"grad_norm": 0.4360826931800694,
"learning_rate": 9.977627820194082e-05,
"loss": 0.5496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5053580403327942,
"step": 90,
"valid_targets_mean": 4189.2,
"valid_targets_min": 815
},
{
"epoch": 0.2996845425867508,
"grad_norm": 0.45768598697634005,
"learning_rate": 9.974589857645802e-05,
"loss": 0.5503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5525804758071899,
"step": 95,
"valid_targets_mean": 3723.3,
"valid_targets_min": 721
},
{
"epoch": 0.31545741324921134,
"grad_norm": 0.45279563265028255,
"learning_rate": 9.97135907107865e-05,
"loss": 0.5593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5906380414962769,
"step": 100,
"valid_targets_mean": 4154.5,
"valid_targets_min": 1312
},
{
"epoch": 0.3312302839116719,
"grad_norm": 0.41876449974133445,
"learning_rate": 9.967935585723706e-05,
"loss": 0.5566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.552190899848938,
"step": 105,
"valid_targets_mean": 4490.0,
"valid_targets_min": 1513
},
{
"epoch": 0.3470031545741325,
"grad_norm": 0.4041961807602131,
"learning_rate": 9.964319534281397e-05,
"loss": 0.562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5655333995819092,
"step": 110,
"valid_targets_mean": 4229.1,
"valid_targets_min": 1399
},
{
"epoch": 0.3627760252365931,
"grad_norm": 0.4960566105435021,
"learning_rate": 9.960511056916357e-05,
"loss": 0.5599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5781254768371582,
"step": 115,
"valid_targets_mean": 3706.1,
"valid_targets_min": 801
},
{
"epoch": 0.3785488958990536,
"grad_norm": 0.4459682147440665,
"learning_rate": 9.956510301251995e-05,
"loss": 0.5354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.499944269657135,
"step": 120,
"valid_targets_mean": 3662.9,
"valid_targets_min": 749
},
{
"epoch": 0.3943217665615142,
"grad_norm": 0.3929671447186755,
"learning_rate": 9.952317422364772e-05,
"loss": 0.5783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5153095722198486,
"step": 125,
"valid_targets_mean": 4084.0,
"valid_targets_min": 1164
},
{
"epoch": 0.41009463722397477,
"grad_norm": 0.42897401373515004,
"learning_rate": 9.947932582778188e-05,
"loss": 0.5513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5479700565338135,
"step": 130,
"valid_targets_mean": 3615.9,
"valid_targets_min": 1030
},
{
"epoch": 0.42586750788643535,
"grad_norm": 0.4514170365892061,
"learning_rate": 9.943355952456483e-05,
"loss": 0.5508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5287145376205444,
"step": 135,
"valid_targets_mean": 3968.4,
"valid_targets_min": 1382
},
{
"epoch": 0.4416403785488959,
"grad_norm": 0.4885467964555453,
"learning_rate": 9.938587708798053e-05,
"loss": 0.5545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6355825066566467,
"step": 140,
"valid_targets_mean": 3822.2,
"valid_targets_min": 994
},
{
"epoch": 0.45741324921135645,
"grad_norm": 0.45050804505844816,
"learning_rate": 9.933628036628569e-05,
"loss": 0.5707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5147861242294312,
"step": 145,
"valid_targets_mean": 4422.2,
"valid_targets_min": 840
},
{
"epoch": 0.47318611987381703,
"grad_norm": 0.4629732361929168,
"learning_rate": 9.92847712819381e-05,
"loss": 0.5351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5328657031059265,
"step": 150,
"valid_targets_mean": 3415.7,
"valid_targets_min": 834
},
{
"epoch": 0.4889589905362776,
"grad_norm": 0.4247700925965094,
"learning_rate": 9.923135183152224e-05,
"loss": 0.5435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5141998529434204,
"step": 155,
"valid_targets_mean": 4627.2,
"valid_targets_min": 1094
},
{
"epoch": 0.5047318611987381,
"grad_norm": 0.3810890570531183,
"learning_rate": 9.91760240856717e-05,
"loss": 0.5583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5300256609916687,
"step": 160,
"valid_targets_mean": 4273.2,
"valid_targets_min": 1231
},
{
"epoch": 0.5205047318611987,
"grad_norm": 0.4096717090938379,
"learning_rate": 9.91187901889891e-05,
"loss": 0.5518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5601193904876709,
"step": 165,
"valid_targets_mean": 3646.8,
"valid_targets_min": 825
},
{
"epoch": 0.5362776025236593,
"grad_norm": 0.42309669942651534,
"learning_rate": 9.905965235996286e-05,
"loss": 0.5438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5901980400085449,
"step": 170,
"valid_targets_mean": 3763.0,
"valid_targets_min": 1202
},
{
"epoch": 0.5520504731861199,
"grad_norm": 0.4221962263816931,
"learning_rate": 9.899861289088121e-05,
"loss": 0.5728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5548031330108643,
"step": 175,
"valid_targets_mean": 3372.2,
"valid_targets_min": 1078
},
{
"epoch": 0.5678233438485805,
"grad_norm": 0.4533484589368771,
"learning_rate": 9.893567414774341e-05,
"loss": 0.5182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5485403537750244,
"step": 180,
"valid_targets_mean": 3786.9,
"valid_targets_min": 813
},
{
"epoch": 0.583596214511041,
"grad_norm": 0.4201455517245677,
"learning_rate": 9.88708385701679e-05,
"loss": 0.5362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5464404821395874,
"step": 185,
"valid_targets_mean": 4054.2,
"valid_targets_min": 718
},
{
"epoch": 0.5993690851735016,
"grad_norm": 0.3816172170313495,
"learning_rate": 9.88041086712979e-05,
"loss": 0.5185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5385897159576416,
"step": 190,
"valid_targets_mean": 3817.4,
"valid_targets_min": 865
},
{
"epoch": 0.6151419558359621,
"grad_norm": 0.38750216847876323,
"learning_rate": 9.873548703770388e-05,
"loss": 0.5143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4823839068412781,
"step": 195,
"valid_targets_mean": 4086.1,
"valid_targets_min": 967
},
{
"epoch": 0.6309148264984227,
"grad_norm": 0.40503340868678855,
"learning_rate": 9.866497632928336e-05,
"loss": 0.5225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5157015919685364,
"step": 200,
"valid_targets_mean": 4078.6,
"valid_targets_min": 950
},
{
"epoch": 0.6466876971608833,
"grad_norm": 0.3541231531701395,
"learning_rate": 9.859257927915774e-05,
"loss": 0.5376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5179704427719116,
"step": 205,
"valid_targets_mean": 3903.1,
"valid_targets_min": 699
},
{
"epoch": 0.6624605678233438,
"grad_norm": 0.41202758172155246,
"learning_rate": 9.851829869356651e-05,
"loss": 0.522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5223180055618286,
"step": 210,
"valid_targets_mean": 4136.1,
"valid_targets_min": 1128
},
{
"epoch": 0.6782334384858044,
"grad_norm": 0.423543405280611,
"learning_rate": 9.844213745175826e-05,
"loss": 0.5332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5781832337379456,
"step": 215,
"valid_targets_mean": 3915.7,
"valid_targets_min": 1093
},
{
"epoch": 0.694006309148265,
"grad_norm": 0.35669299013566746,
"learning_rate": 9.83640985058792e-05,
"loss": 0.5092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47874531149864197,
"step": 220,
"valid_targets_mean": 3844.2,
"valid_targets_min": 742
},
{
"epoch": 0.7097791798107256,
"grad_norm": 0.3925005403471201,
"learning_rate": 9.828418488085877e-05,
"loss": 0.5302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5382158756256104,
"step": 225,
"valid_targets_mean": 3521.7,
"valid_targets_min": 1095
},
{
"epoch": 0.7255520504731862,
"grad_norm": 0.4325120394989433,
"learning_rate": 9.820239967429233e-05,
"loss": 0.5371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5795000791549683,
"step": 230,
"valid_targets_mean": 3122.2,
"valid_targets_min": 641
},
{
"epoch": 0.7413249211356467,
"grad_norm": 0.36208200156129844,
"learning_rate": 9.811874605632104e-05,
"loss": 0.5283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5075106620788574,
"step": 235,
"valid_targets_mean": 4049.4,
"valid_targets_min": 691
},
{
"epoch": 0.7570977917981072,
"grad_norm": 0.39540549433667344,
"learning_rate": 9.803322726950905e-05,
"loss": 0.5378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5728358626365662,
"step": 240,
"valid_targets_mean": 4206.9,
"valid_targets_min": 996
},
{
"epoch": 0.7728706624605678,
"grad_norm": 0.41657667507777546,
"learning_rate": 9.794584662871787e-05,
"loss": 0.5135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5691760778427124,
"step": 245,
"valid_targets_mean": 3891.3,
"valid_targets_min": 717
},
{
"epoch": 0.7886435331230284,
"grad_norm": 0.36129818659509033,
"learning_rate": 9.785660752097768e-05,
"loss": 0.511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49009859561920166,
"step": 250,
"valid_targets_mean": 4718.1,
"valid_targets_min": 1376
},
{
"epoch": 0.804416403785489,
"grad_norm": 0.3954585394141833,
"learning_rate": 9.77655134053563e-05,
"loss": 0.5271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5566205978393555,
"step": 255,
"valid_targets_mean": 3992.4,
"valid_targets_min": 922
},
{
"epoch": 0.8201892744479495,
"grad_norm": 0.4457152822998143,
"learning_rate": 9.767256781282486e-05,
"loss": 0.5459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5469316244125366,
"step": 260,
"valid_targets_mean": 3295.2,
"valid_targets_min": 942
},
{
"epoch": 0.8359621451104101,
"grad_norm": 0.42830831852575374,
"learning_rate": 9.757777434612116e-05,
"loss": 0.5321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5643436908721924,
"step": 265,
"valid_targets_mean": 3402.6,
"valid_targets_min": 849
},
{
"epoch": 0.8517350157728707,
"grad_norm": 0.35560598847559505,
"learning_rate": 9.748113667960987e-05,
"loss": 0.5416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5399414300918579,
"step": 270,
"valid_targets_mean": 4290.6,
"valid_targets_min": 801
},
{
"epoch": 0.8675078864353313,
"grad_norm": 0.3318267291185689,
"learning_rate": 9.738265855914013e-05,
"loss": 0.4984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5012451410293579,
"step": 275,
"valid_targets_mean": 4652.2,
"valid_targets_min": 1522
},
{
"epoch": 0.8832807570977917,
"grad_norm": 0.37641165858900405,
"learning_rate": 9.728234380190038e-05,
"loss": 0.5217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5358394384384155,
"step": 280,
"valid_targets_mean": 3566.7,
"valid_targets_min": 356
},
{
"epoch": 0.8990536277602523,
"grad_norm": 0.3707422402953193,
"learning_rate": 9.718019629627045e-05,
"loss": 0.5383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5315133333206177,
"step": 285,
"valid_targets_mean": 4248.1,
"valid_targets_min": 1506
},
{
"epoch": 0.9148264984227129,
"grad_norm": 0.36379579886903163,
"learning_rate": 9.70762200016707e-05,
"loss": 0.5156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49599626660346985,
"step": 290,
"valid_targets_mean": 3829.4,
"valid_targets_min": 319
},
{
"epoch": 0.9305993690851735,
"grad_norm": 0.3602052757244127,
"learning_rate": 9.697041894840865e-05,
"loss": 0.5172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5145964622497559,
"step": 295,
"valid_targets_mean": 3755.7,
"valid_targets_min": 1000
},
{
"epoch": 0.9463722397476341,
"grad_norm": 0.3383105129798826,
"learning_rate": 9.68627972375228e-05,
"loss": 0.5197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5156067609786987,
"step": 300,
"valid_targets_mean": 4581.9,
"valid_targets_min": 1023
},
{
"epoch": 0.9621451104100947,
"grad_norm": 0.39478296443847477,
"learning_rate": 9.675335904062353e-05,
"loss": 0.509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5009207129478455,
"step": 305,
"valid_targets_mean": 3574.9,
"valid_targets_min": 704
},
{
"epoch": 0.9779179810725552,
"grad_norm": 0.3701507161997181,
"learning_rate": 9.66421085997315e-05,
"loss": 0.515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5108104944229126,
"step": 310,
"valid_targets_mean": 3732.2,
"valid_targets_min": 663
},
{
"epoch": 0.9936908517350158,
"grad_norm": 0.36362679379892143,
"learning_rate": 9.65290502271132e-05,
"loss": 0.5298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5177055597305298,
"step": 315,
"valid_targets_mean": 4006.8,
"valid_targets_min": 862
},
{
"epoch": 1.0094637223974763,
"grad_norm": 0.44494333561483296,
"learning_rate": 9.641418830511377e-05,
"loss": 0.469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4171540141105652,
"step": 320,
"valid_targets_mean": 3149.5,
"valid_targets_min": 519
},
{
"epoch": 1.025236593059937,
"grad_norm": 0.3391573696995791,
"learning_rate": 9.62975272859872e-05,
"loss": 0.4145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39022213220596313,
"step": 325,
"valid_targets_mean": 4175.0,
"valid_targets_min": 1192
},
{
"epoch": 1.0410094637223974,
"grad_norm": 0.4148022873924609,
"learning_rate": 9.617907169172367e-05,
"loss": 0.4115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4439923167228699,
"step": 330,
"valid_targets_mean": 3986.2,
"valid_targets_min": 869
},
{
"epoch": 1.0567823343848581,
"grad_norm": 0.3565887954497388,
"learning_rate": 9.605882611387432e-05,
"loss": 0.4526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44107919931411743,
"step": 335,
"valid_targets_mean": 4259.3,
"valid_targets_min": 976
},
{
"epoch": 1.0725552050473186,
"grad_norm": 0.3907577587630456,
"learning_rate": 9.593679521337327e-05,
"loss": 0.4484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45283353328704834,
"step": 340,
"valid_targets_mean": 3893.7,
"valid_targets_min": 1418
},
{
"epoch": 1.088328075709779,
"grad_norm": 0.3807742307702375,
"learning_rate": 9.581298372035695e-05,
"loss": 0.4302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4250805675983429,
"step": 345,
"valid_targets_mean": 3853.0,
"valid_targets_min": 965
},
{
"epoch": 1.1041009463722398,
"grad_norm": 0.44905191912330616,
"learning_rate": 9.56873964339807e-05,
"loss": 0.4462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5217335224151611,
"step": 350,
"valid_targets_mean": 2976.3,
"valid_targets_min": 827
},
{
"epoch": 1.1198738170347002,
"grad_norm": 0.3699538409851181,
"learning_rate": 9.556003822223287e-05,
"loss": 0.4148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3780270218849182,
"step": 355,
"valid_targets_mean": 4304.0,
"valid_targets_min": 863
},
{
"epoch": 1.135646687697161,
"grad_norm": 0.38031489838469096,
"learning_rate": 9.5430914021746e-05,
"loss": 0.4371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4074738323688507,
"step": 360,
"valid_targets_mean": 3196.3,
"valid_targets_min": 1161
},
{
"epoch": 1.1514195583596214,
"grad_norm": 0.382134493241582,
"learning_rate": 9.530002883760552e-05,
"loss": 0.4218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43987852334976196,
"step": 365,
"valid_targets_mean": 3962.5,
"valid_targets_min": 899
},
{
"epoch": 1.167192429022082,
"grad_norm": 0.37585063446780165,
"learning_rate": 9.516738774315577e-05,
"loss": 0.4395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4138225018978119,
"step": 370,
"valid_targets_mean": 3164.1,
"valid_targets_min": 762
},
{
"epoch": 1.1829652996845426,
"grad_norm": 0.3805495887688742,
"learning_rate": 9.503299587980331e-05,
"loss": 0.4434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44806328415870667,
"step": 375,
"valid_targets_mean": 3578.8,
"valid_targets_min": 623
},
{
"epoch": 1.1987381703470033,
"grad_norm": 0.376773409845666,
"learning_rate": 9.489685845681762e-05,
"loss": 0.4428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4336075186729431,
"step": 380,
"valid_targets_mean": 3914.1,
"valid_targets_min": 961
},
{
"epoch": 1.2145110410094637,
"grad_norm": 0.38804566747120484,
"learning_rate": 9.47589807511292e-05,
"loss": 0.4292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4264313876628876,
"step": 385,
"valid_targets_mean": 3593.9,
"valid_targets_min": 742
},
{
"epoch": 1.2302839116719242,
"grad_norm": 0.36513112328321634,
"learning_rate": 9.461936810712507e-05,
"loss": 0.4611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47045087814331055,
"step": 390,
"valid_targets_mean": 4321.6,
"valid_targets_min": 1088
},
{
"epoch": 1.2460567823343849,
"grad_norm": 0.39079786099369523,
"learning_rate": 9.447802593644152e-05,
"loss": 0.4318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5255352258682251,
"step": 395,
"valid_targets_mean": 3777.8,
"valid_targets_min": 898
},
{
"epoch": 1.2618296529968454,
"grad_norm": 0.3398501520957368,
"learning_rate": 9.433495971775444e-05,
"loss": 0.4169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4048163890838623,
"step": 400,
"valid_targets_mean": 4000.7,
"valid_targets_min": 1370
},
{
"epoch": 1.277602523659306,
"grad_norm": 0.3670308220814651,
"learning_rate": 9.419017499656686e-05,
"loss": 0.4393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4233490228652954,
"step": 405,
"valid_targets_mean": 3596.8,
"valid_targets_min": 835
},
{
"epoch": 1.2933753943217665,
"grad_norm": 0.40227891912103875,
"learning_rate": 9.404367738499409e-05,
"loss": 0.4616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.465755432844162,
"step": 410,
"valid_targets_mean": 3719.0,
"valid_targets_min": 854
},
{
"epoch": 1.3091482649842272,
"grad_norm": 0.35283201135451225,
"learning_rate": 9.38954725615461e-05,
"loss": 0.4729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45133858919143677,
"step": 415,
"valid_targets_mean": 4254.4,
"valid_targets_min": 646
},
{
"epoch": 1.3249211356466877,
"grad_norm": 0.3570013813746019,
"learning_rate": 9.374556627090749e-05,
"loss": 0.4627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4204801619052887,
"step": 420,
"valid_targets_mean": 3770.4,
"valid_targets_min": 337
},
{
"epoch": 1.3406940063091484,
"grad_norm": 0.37223503941855,
"learning_rate": 9.359396432371476e-05,
"loss": 0.4677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5173239707946777,
"step": 425,
"valid_targets_mean": 4230.2,
"valid_targets_min": 1114
},
{
"epoch": 1.3564668769716088,
"grad_norm": 0.3301770644383114,
"learning_rate": 9.344067259633112e-05,
"loss": 0.4323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.398292601108551,
"step": 430,
"valid_targets_mean": 4243.5,
"valid_targets_min": 1054
},
{
"epoch": 1.3722397476340693,
"grad_norm": 0.36270954698851193,
"learning_rate": 9.328569703061862e-05,
"loss": 0.4336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45556944608688354,
"step": 435,
"valid_targets_mean": 3909.2,
"valid_targets_min": 671
},
{
"epoch": 1.38801261829653,
"grad_norm": 0.37539857073698474,
"learning_rate": 9.3129043633708e-05,
"loss": 0.4421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4796835482120514,
"step": 440,
"valid_targets_mean": 4132.4,
"valid_targets_min": 658
},
{
"epoch": 1.4037854889589905,
"grad_norm": 0.33638929802502493,
"learning_rate": 9.297071847776568e-05,
"loss": 0.4423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4059070646762848,
"step": 445,
"valid_targets_mean": 3642.7,
"valid_targets_min": 726
},
{
"epoch": 1.4195583596214512,
"grad_norm": 0.4001184728503333,
"learning_rate": 9.281072769975847e-05,
"loss": 0.4443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47804516553878784,
"step": 450,
"valid_targets_mean": 3378.8,
"valid_targets_min": 758
},
{
"epoch": 1.4353312302839116,
"grad_norm": 0.4029482297411805,
"learning_rate": 9.264907750121568e-05,
"loss": 0.4334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44277799129486084,
"step": 455,
"valid_targets_mean": 3196.6,
"valid_targets_min": 841
},
{
"epoch": 1.4511041009463723,
"grad_norm": 0.4036784853782572,
"learning_rate": 9.248577414798871e-05,
"loss": 0.4416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43349453806877136,
"step": 460,
"valid_targets_mean": 3283.0,
"valid_targets_min": 635
},
{
"epoch": 1.4668769716088328,
"grad_norm": 0.36312925454919104,
"learning_rate": 9.232082397000826e-05,
"loss": 0.4275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4773409962654114,
"step": 465,
"valid_targets_mean": 3814.1,
"valid_targets_min": 691
},
{
"epoch": 1.4826498422712935,
"grad_norm": 0.3528726566779447,
"learning_rate": 9.215423336103884e-05,
"loss": 0.4431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4232112765312195,
"step": 470,
"valid_targets_mean": 4029.1,
"valid_targets_min": 335
},
{
"epoch": 1.498422712933754,
"grad_norm": 0.41683241533869353,
"learning_rate": 9.198600877843105e-05,
"loss": 0.4412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48993387818336487,
"step": 475,
"valid_targets_mean": 2998.8,
"valid_targets_min": 977
},
{
"epoch": 1.5141955835962144,
"grad_norm": 0.34971035022348906,
"learning_rate": 9.181615674287121e-05,
"loss": 0.4461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43452027440071106,
"step": 480,
"valid_targets_mean": 4365.5,
"valid_targets_min": 1207
},
{
"epoch": 1.5299684542586751,
"grad_norm": 0.7751137379112104,
"learning_rate": 9.164468383812864e-05,
"loss": 0.4403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4532795548439026,
"step": 485,
"valid_targets_mean": 3795.7,
"valid_targets_min": 1359
},
{
"epoch": 1.5457413249211358,
"grad_norm": 0.401862455648203,
"learning_rate": 9.147159671080049e-05,
"loss": 0.4559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4684237539768219,
"step": 490,
"valid_targets_mean": 3587.4,
"valid_targets_min": 666
},
{
"epoch": 1.5615141955835963,
"grad_norm": 0.37373814768090685,
"learning_rate": 9.129690207005402e-05,
"loss": 0.4551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4561198949813843,
"step": 495,
"valid_targets_mean": 3667.8,
"valid_targets_min": 1183
},
{
"epoch": 1.5772870662460567,
"grad_norm": 0.3475217588458817,
"learning_rate": 9.11206066873666e-05,
"loss": 0.439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43660348653793335,
"step": 500,
"valid_targets_mean": 3716.6,
"valid_targets_min": 717
},
{
"epoch": 1.5930599369085172,
"grad_norm": 0.4051905185882745,
"learning_rate": 9.094271739626326e-05,
"loss": 0.4559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43010252714157104,
"step": 505,
"valid_targets_mean": 2970.6,
"valid_targets_min": 702
},
{
"epoch": 1.608832807570978,
"grad_norm": 0.34036475182222864,
"learning_rate": 9.076324109205174e-05,
"loss": 0.4507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4386584162712097,
"step": 510,
"valid_targets_mean": 3959.9,
"valid_targets_min": 589
},
{
"epoch": 1.6246056782334386,
"grad_norm": 0.3498122275381102,
"learning_rate": 9.058218473155528e-05,
"loss": 0.4333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4222657084465027,
"step": 515,
"valid_targets_mean": 3462.6,
"valid_targets_min": 873
},
{
"epoch": 1.640378548895899,
"grad_norm": 0.3369248339344111,
"learning_rate": 9.039955533284292e-05,
"loss": 0.4527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4398431181907654,
"step": 520,
"valid_targets_mean": 3989.6,
"valid_targets_min": 1064
},
{
"epoch": 1.6561514195583595,
"grad_norm": 0.36080386098017403,
"learning_rate": 9.021535997495749e-05,
"loss": 0.471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48137784004211426,
"step": 525,
"valid_targets_mean": 3954.6,
"valid_targets_min": 866
},
{
"epoch": 1.6719242902208202,
"grad_norm": 0.3718481057610134,
"learning_rate": 9.002960579764116e-05,
"loss": 0.4503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4851943254470825,
"step": 530,
"valid_targets_mean": 3200.0,
"valid_targets_min": 440
},
{
"epoch": 1.687697160883281,
"grad_norm": 0.36465288551264813,
"learning_rate": 8.984230000105882e-05,
"loss": 0.4455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4893612265586853,
"step": 535,
"valid_targets_mean": 3724.4,
"valid_targets_min": 1164
},
{
"epoch": 1.7034700315457414,
"grad_norm": 0.32735990049855485,
"learning_rate": 8.965344984551882e-05,
"loss": 0.4431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38390782475471497,
"step": 540,
"valid_targets_mean": 3728.2,
"valid_targets_min": 765
},
{
"epoch": 1.7192429022082019,
"grad_norm": 0.3405505588639974,
"learning_rate": 8.946306265119167e-05,
"loss": 0.434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4467661380767822,
"step": 545,
"valid_targets_mean": 3709.7,
"valid_targets_min": 1553
},
{
"epoch": 1.7350157728706623,
"grad_norm": 0.3652479819607644,
"learning_rate": 8.927114579782625e-05,
"loss": 0.4376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43158066272735596,
"step": 550,
"valid_targets_mean": 3628.7,
"valid_targets_min": 882
},
{
"epoch": 1.750788643533123,
"grad_norm": 0.3822997428821815,
"learning_rate": 8.907770672446381e-05,
"loss": 0.4574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4463322162628174,
"step": 555,
"valid_targets_mean": 3338.1,
"valid_targets_min": 789
},
{
"epoch": 1.7665615141955837,
"grad_norm": 0.3485646535388207,
"learning_rate": 8.888275292914948e-05,
"loss": 0.4397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42743009328842163,
"step": 560,
"valid_targets_mean": 3594.6,
"valid_targets_min": 721
},
{
"epoch": 1.7823343848580442,
"grad_norm": 0.3109895750423863,
"learning_rate": 8.868629196864182e-05,
"loss": 0.4264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3907405138015747,
"step": 565,
"valid_targets_mean": 4172.2,
"valid_targets_min": 961
},
{
"epoch": 1.7981072555205047,
"grad_norm": 0.3707666760898621,
"learning_rate": 8.848833145811976e-05,
"loss": 0.4486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4277447760105133,
"step": 570,
"valid_targets_mean": 3259.4,
"valid_targets_min": 1124
},
{
"epoch": 1.8138801261829653,
"grad_norm": 0.4062312243161753,
"learning_rate": 8.828887907088753e-05,
"loss": 0.4338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45710551738739014,
"step": 575,
"valid_targets_mean": 3280.9,
"valid_targets_min": 685
},
{
"epoch": 1.8296529968454258,
"grad_norm": 0.34345659850944893,
"learning_rate": 8.808794253807707e-05,
"loss": 0.4275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40221577882766724,
"step": 580,
"valid_targets_mean": 3658.1,
"valid_targets_min": 619
},
{
"epoch": 1.8454258675078865,
"grad_norm": 0.3330687260048639,
"learning_rate": 8.788552964834859e-05,
"loss": 0.4468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46073347330093384,
"step": 585,
"valid_targets_mean": 3980.0,
"valid_targets_min": 1109
},
{
"epoch": 1.861198738170347,
"grad_norm": 0.3397094597785125,
"learning_rate": 8.768164824758846e-05,
"loss": 0.4558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4085126221179962,
"step": 590,
"valid_targets_mean": 3243.0,
"valid_targets_min": 442
},
{
"epoch": 1.8769716088328074,
"grad_norm": 0.31999705156875274,
"learning_rate": 8.747630623860521e-05,
"loss": 0.4274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41694074869155884,
"step": 595,
"valid_targets_mean": 4215.4,
"valid_targets_min": 950
},
{
"epoch": 1.8927444794952681,
"grad_norm": 0.33040562917463656,
"learning_rate": 8.726951158082311e-05,
"loss": 0.4339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4324493408203125,
"step": 600,
"valid_targets_mean": 4159.7,
"valid_targets_min": 1175
},
{
"epoch": 1.9085173501577288,
"grad_norm": 0.36434921623211575,
"learning_rate": 8.706127228997376e-05,
"loss": 0.4539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4327438175678253,
"step": 605,
"valid_targets_mean": 3312.7,
"valid_targets_min": 1082
},
{
"epoch": 1.9242902208201893,
"grad_norm": 0.35804162946121054,
"learning_rate": 8.685159643778528e-05,
"loss": 0.431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4164193272590637,
"step": 610,
"valid_targets_mean": 3273.8,
"valid_targets_min": 1083
},
{
"epoch": 1.9400630914826498,
"grad_norm": 0.3485498776902668,
"learning_rate": 8.664049215166955e-05,
"loss": 0.4606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5004233717918396,
"step": 615,
"valid_targets_mean": 4313.6,
"valid_targets_min": 856
},
{
"epoch": 1.9558359621451105,
"grad_norm": 0.3544861888530339,
"learning_rate": 8.6427967614407e-05,
"loss": 0.4387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4689190089702606,
"step": 620,
"valid_targets_mean": 3861.9,
"valid_targets_min": 1276
},
{
"epoch": 1.971608832807571,
"grad_norm": 0.35670645569674425,
"learning_rate": 8.621403106382968e-05,
"loss": 0.4398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4165767431259155,
"step": 625,
"valid_targets_mean": 3283.2,
"valid_targets_min": 1086
},
{
"epoch": 1.9873817034700316,
"grad_norm": 0.3739226579042923,
"learning_rate": 8.599869079250165e-05,
"loss": 0.4582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4649926424026489,
"step": 630,
"valid_targets_mean": 3385.2,
"valid_targets_min": 421
},
{
"epoch": 2.003154574132492,
"grad_norm": 0.4652236465790686,
"learning_rate": 8.578195514739784e-05,
"loss": 0.4383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3751116096973419,
"step": 635,
"valid_targets_mean": 3725.0,
"valid_targets_min": 1248
},
{
"epoch": 2.0189274447949526,
"grad_norm": 0.43822671559849474,
"learning_rate": 8.556383252958026e-05,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3273969292640686,
"step": 640,
"valid_targets_mean": 3735.2,
"valid_targets_min": 835
},
{
"epoch": 2.034700315457413,
"grad_norm": 0.34010705122481344,
"learning_rate": 8.534433139387259e-05,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3301159739494324,
"step": 645,
"valid_targets_mean": 4554.8,
"valid_targets_min": 1244
},
{
"epoch": 2.050473186119874,
"grad_norm": 0.3775080402751895,
"learning_rate": 8.512346024853219e-05,
"loss": 0.3432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3433346152305603,
"step": 650,
"valid_targets_mean": 3910.6,
"valid_targets_min": 1627
},
{
"epoch": 2.0662460567823344,
"grad_norm": 0.3728164026489659,
"learning_rate": 8.490122765492057e-05,
"loss": 0.3577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3310161828994751,
"step": 655,
"valid_targets_mean": 3759.2,
"valid_targets_min": 356
},
{
"epoch": 2.082018927444795,
"grad_norm": 0.37117967483663206,
"learning_rate": 8.467764222717136e-05,
"loss": 0.3287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32798779010772705,
"step": 660,
"valid_targets_mean": 3875.6,
"valid_targets_min": 918
},
{
"epoch": 2.0977917981072554,
"grad_norm": 0.41952911991741526,
"learning_rate": 8.445271263185646e-05,
"loss": 0.3454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38159024715423584,
"step": 665,
"valid_targets_mean": 3336.3,
"valid_targets_min": 637
},
{
"epoch": 2.1135646687697163,
"grad_norm": 0.3661960517220788,
"learning_rate": 8.422644758765012e-05,
"loss": 0.3308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3457246422767639,
"step": 670,
"valid_targets_mean": 4169.8,
"valid_targets_min": 1332
},
{
"epoch": 2.1293375394321767,
"grad_norm": 0.36231858184940324,
"learning_rate": 8.399885586499101e-05,
"loss": 0.3229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32879745960235596,
"step": 675,
"valid_targets_mean": 4030.4,
"valid_targets_min": 687
},
{
"epoch": 2.145110410094637,
"grad_norm": 0.3744186649078691,
"learning_rate": 8.376994628574219e-05,
"loss": 0.3333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3317606747150421,
"step": 680,
"valid_targets_mean": 4177.5,
"valid_targets_min": 763
},
{
"epoch": 2.1608832807570977,
"grad_norm": 0.401336910401923,
"learning_rate": 8.353972772284927e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34010061621665955,
"step": 685,
"valid_targets_mean": 3503.7,
"valid_targets_min": 1008
},
{
"epoch": 2.176656151419558,
"grad_norm": 0.38258080569669956,
"learning_rate": 8.330820909999633e-05,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34190699458122253,
"step": 690,
"valid_targets_mean": 3343.3,
"valid_targets_min": 1412
},
{
"epoch": 2.192429022082019,
"grad_norm": 0.4079088718039198,
"learning_rate": 8.307539939126016e-05,
"loss": 0.3262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35490545630455017,
"step": 695,
"valid_targets_mean": 3479.4,
"valid_targets_min": 1019
},
{
"epoch": 2.2082018927444795,
"grad_norm": 0.3784901118731761,
"learning_rate": 8.284130762076235e-05,
"loss": 0.3276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3070756793022156,
"step": 700,
"valid_targets_mean": 3581.0,
"valid_targets_min": 814
},
{
"epoch": 2.22397476340694,
"grad_norm": 0.3620067925312215,
"learning_rate": 8.260594286231947e-05,
"loss": 0.3275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36078643798828125,
"step": 705,
"valid_targets_mean": 4102.9,
"valid_targets_min": 930
},
{
"epoch": 2.2397476340694005,
"grad_norm": 0.37855572907947915,
"learning_rate": 8.236931423909138e-05,
"loss": 0.3422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3413460850715637,
"step": 710,
"valid_targets_mean": 3942.3,
"valid_targets_min": 854
},
{
"epoch": 2.2555205047318614,
"grad_norm": 0.3736466247053816,
"learning_rate": 8.213143092322769e-05,
"loss": 0.319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37210655212402344,
"step": 715,
"valid_targets_mean": 3995.8,
"valid_targets_min": 999
},
{
"epoch": 2.271293375394322,
"grad_norm": 0.36249923496948544,
"learning_rate": 8.189230213551202e-05,
"loss": 0.3456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3457183837890625,
"step": 720,
"valid_targets_mean": 3800.2,
"valid_targets_min": 1066
},
{
"epoch": 2.2870662460567823,
"grad_norm": 0.39967218810071103,
"learning_rate": 8.165193714500481e-05,
"loss": 0.3593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37980931997299194,
"step": 725,
"valid_targets_mean": 3775.7,
"valid_targets_min": 711
},
{
"epoch": 2.302839116719243,
"grad_norm": 0.3735154397123298,
"learning_rate": 8.141034526868389e-05,
"loss": 0.3396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3548370599746704,
"step": 730,
"valid_targets_mean": 3849.8,
"valid_targets_min": 1156
},
{
"epoch": 2.3186119873817033,
"grad_norm": 0.33566493790874236,
"learning_rate": 8.116753587108339e-05,
"loss": 0.3275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3007664680480957,
"step": 735,
"valid_targets_mean": 4062.7,
"valid_targets_min": 753
},
{
"epoch": 2.334384858044164,
"grad_norm": 0.34171038668054404,
"learning_rate": 8.092351836393076e-05,
"loss": 0.3394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3267410397529602,
"step": 740,
"valid_targets_mean": 4180.0,
"valid_targets_min": 1298
},
{
"epoch": 2.3501577287066246,
"grad_norm": 0.4143460695405696,
"learning_rate": 8.067830220578191e-05,
"loss": 0.3717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3674328625202179,
"step": 745,
"valid_targets_mean": 3244.7,
"valid_targets_min": 841
},
{
"epoch": 2.365930599369085,
"grad_norm": 0.3698488243960478,
"learning_rate": 8.043189690165467e-05,
"loss": 0.3322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3374217450618744,
"step": 750,
"valid_targets_mean": 3789.4,
"valid_targets_min": 791
},
{
"epoch": 2.3817034700315456,
"grad_norm": 0.35690943739773573,
"learning_rate": 8.018431200266023e-05,
"loss": 0.3334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33900323510169983,
"step": 755,
"valid_targets_mean": 3827.4,
"valid_targets_min": 895
},
{
"epoch": 2.3974763406940065,
"grad_norm": 0.3850669222911541,
"learning_rate": 7.993555710563303e-05,
"loss": 0.3301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33071190118789673,
"step": 760,
"valid_targets_mean": 3576.0,
"valid_targets_min": 843
},
{
"epoch": 2.413249211356467,
"grad_norm": 0.35558033307659687,
"learning_rate": 7.968564185275873e-05,
"loss": 0.3503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34395042061805725,
"step": 765,
"valid_targets_mean": 4245.2,
"valid_targets_min": 1665
},
{
"epoch": 2.4290220820189274,
"grad_norm": 0.3696713237256321,
"learning_rate": 7.943457593120045e-05,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3495572805404663,
"step": 770,
"valid_targets_mean": 3356.2,
"valid_targets_min": 976
},
{
"epoch": 2.444794952681388,
"grad_norm": 0.31257484242301387,
"learning_rate": 7.918236907272327e-05,
"loss": 0.3453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33376145362854004,
"step": 775,
"valid_targets_mean": 4976.2,
"valid_targets_min": 1063
},
{
"epoch": 2.4605678233438484,
"grad_norm": 0.3960160133368537,
"learning_rate": 7.892903105331712e-05,
"loss": 0.34,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35692280530929565,
"step": 780,
"valid_targets_mean": 3351.8,
"valid_targets_min": 238
},
{
"epoch": 2.4763406940063093,
"grad_norm": 0.4017364185807611,
"learning_rate": 7.867457169281765e-05,
"loss": 0.3489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34925976395606995,
"step": 785,
"valid_targets_mean": 3252.7,
"valid_targets_min": 1102
},
{
"epoch": 2.4921135646687698,
"grad_norm": 0.36347535237779893,
"learning_rate": 7.841900085452574e-05,
"loss": 0.3527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32482895255088806,
"step": 790,
"valid_targets_mean": 3577.0,
"valid_targets_min": 1141
},
{
"epoch": 2.5078864353312302,
"grad_norm": 0.3659525671502537,
"learning_rate": 7.816232844482516e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31454741954803467,
"step": 795,
"valid_targets_mean": 3475.5,
"valid_targets_min": 319
},
{
"epoch": 2.5236593059936907,
"grad_norm": 0.38262913290066447,
"learning_rate": 7.790456441279853e-05,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33849939703941345,
"step": 800,
"valid_targets_mean": 3591.1,
"valid_targets_min": 380
},
{
"epoch": 2.5394321766561516,
"grad_norm": 0.3945192774714041,
"learning_rate": 7.764571874984174e-05,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39895951747894287,
"step": 805,
"valid_targets_mean": 3441.2,
"valid_targets_min": 1072
},
{
"epoch": 2.555205047318612,
"grad_norm": 0.4103794578592908,
"learning_rate": 7.73858014892766e-05,
"loss": 0.3504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38766610622406006,
"step": 810,
"valid_targets_mean": 3518.4,
"valid_targets_min": 702
},
{
"epoch": 2.5709779179810726,
"grad_norm": 0.34204539742317147,
"learning_rate": 7.712482270596199e-05,
"loss": 0.328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32463714480400085,
"step": 815,
"valid_targets_mean": 3946.6,
"valid_targets_min": 982
},
{
"epoch": 2.586750788643533,
"grad_norm": 0.38589899224927104,
"learning_rate": 7.686279251590331e-05,
"loss": 0.3359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3244478702545166,
"step": 820,
"valid_targets_mean": 3312.8,
"valid_targets_min": 615
},
{
"epoch": 2.6025236593059935,
"grad_norm": 0.4052155719856952,
"learning_rate": 7.659972107586035e-05,
"loss": 0.3533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3753927946090698,
"step": 825,
"valid_targets_mean": 4110.9,
"valid_targets_min": 883
},
{
"epoch": 2.6182965299684544,
"grad_norm": 0.343927305431227,
"learning_rate": 7.633561858295364e-05,
"loss": 0.3614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36553817987442017,
"step": 830,
"valid_targets_mean": 4224.3,
"valid_targets_min": 1532
},
{
"epoch": 2.634069400630915,
"grad_norm": 0.37883054228512897,
"learning_rate": 7.607049527426916e-05,
"loss": 0.3531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33783310651779175,
"step": 835,
"valid_targets_mean": 3950.9,
"valid_targets_min": 604
},
{
"epoch": 2.6498422712933754,
"grad_norm": 0.37159620397410714,
"learning_rate": 7.580436142646155e-05,
"loss": 0.3615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38431215286254883,
"step": 840,
"valid_targets_mean": 4062.4,
"valid_targets_min": 994
},
{
"epoch": 2.665615141955836,
"grad_norm": 0.355718961519934,
"learning_rate": 7.55372273553557e-05,
"loss": 0.3458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32091930508613586,
"step": 845,
"valid_targets_mean": 3696.0,
"valid_targets_min": 910
},
{
"epoch": 2.6813880126182967,
"grad_norm": 0.3361604204167694,
"learning_rate": 7.526910341554703e-05,
"loss": 0.3463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34885716438293457,
"step": 850,
"valid_targets_mean": 4492.7,
"valid_targets_min": 1779
},
{
"epoch": 2.697160883280757,
"grad_norm": 0.366769390411755,
"learning_rate": 7.500000000000001e-05,
"loss": 0.351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33402395248413086,
"step": 855,
"valid_targets_mean": 3548.5,
"valid_targets_min": 1455
},
{
"epoch": 2.7129337539432177,
"grad_norm": 0.3691866466890524,
"learning_rate": 7.472992753964532e-05,
"loss": 0.3578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3604165017604828,
"step": 860,
"valid_targets_mean": 3894.6,
"valid_targets_min": 1009
},
{
"epoch": 2.728706624605678,
"grad_norm": 0.3289605476496754,
"learning_rate": 7.445889650297559e-05,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3566170334815979,
"step": 865,
"valid_targets_mean": 4428.1,
"valid_targets_min": 1215
},
{
"epoch": 2.7444794952681386,
"grad_norm": 0.36697277963466485,
"learning_rate": 7.418691739563957e-05,
"loss": 0.3316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3522750735282898,
"step": 870,
"valid_targets_mean": 3775.8,
"valid_targets_min": 1260
},
{
"epoch": 2.7602523659305995,
"grad_norm": 0.37685217196788956,
"learning_rate": 7.391400076003492e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3203175961971283,
"step": 875,
"valid_targets_mean": 3458.9,
"valid_targets_min": 650
},
{
"epoch": 2.77602523659306,
"grad_norm": 0.39105467876376565,
"learning_rate": 7.36401571748996e-05,
"loss": 0.3435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3444768786430359,
"step": 880,
"valid_targets_mean": 3191.3,
"valid_targets_min": 898
},
{
"epoch": 2.7917981072555205,
"grad_norm": 0.3480244096566246,
"learning_rate": 7.336539725490178e-05,
"loss": 0.3664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34411507844924927,
"step": 885,
"valid_targets_mean": 4004.1,
"valid_targets_min": 843
},
{
"epoch": 2.807570977917981,
"grad_norm": 0.3827153845033614,
"learning_rate": 7.30897316502284e-05,
"loss": 0.3513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37474557757377625,
"step": 890,
"valid_targets_mean": 3213.1,
"valid_targets_min": 1265
},
{
"epoch": 2.823343848580442,
"grad_norm": 0.35019919394636845,
"learning_rate": 7.281317104617239e-05,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3495219349861145,
"step": 895,
"valid_targets_mean": 3676.5,
"valid_targets_min": 839
},
{
"epoch": 2.8391167192429023,
"grad_norm": 0.3668968163187891,
"learning_rate": 7.253572616271844e-05,
"loss": 0.3543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3313937187194824,
"step": 900,
"valid_targets_mean": 3489.2,
"valid_targets_min": 1149
},
{
"epoch": 2.854889589905363,
"grad_norm": 0.35242471370100514,
"learning_rate": 7.225740775412751e-05,
"loss": 0.3455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32235974073410034,
"step": 905,
"valid_targets_mean": 4352.0,
"valid_targets_min": 1082
},
{
"epoch": 2.8706624605678233,
"grad_norm": 0.3664024727243619,
"learning_rate": 7.197822660851991e-05,
"loss": 0.3538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3668972849845886,
"step": 910,
"valid_targets_mean": 4366.6,
"valid_targets_min": 335
},
{
"epoch": 2.8864353312302837,
"grad_norm": 0.3578280364539068,
"learning_rate": 7.169819354745725e-05,
"loss": 0.3552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3774711489677429,
"step": 915,
"valid_targets_mean": 3474.4,
"valid_targets_min": 902
},
{
"epoch": 2.9022082018927446,
"grad_norm": 0.39067610873109937,
"learning_rate": 7.141731942552288e-05,
"loss": 0.3686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37125909328460693,
"step": 920,
"valid_targets_mean": 3281.9,
"valid_targets_min": 1015
},
{
"epoch": 2.917981072555205,
"grad_norm": 0.36500287371289847,
"learning_rate": 7.113561512990119e-05,
"loss": 0.3568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34835952520370483,
"step": 925,
"valid_targets_mean": 3716.3,
"valid_targets_min": 648
},
{
"epoch": 2.9337539432176656,
"grad_norm": 0.3640542876272178,
"learning_rate": 7.085309157995557e-05,
"loss": 0.3656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35117635130882263,
"step": 930,
"valid_targets_mean": 3512.1,
"valid_targets_min": 937
},
{
"epoch": 2.949526813880126,
"grad_norm": 0.35850312668982054,
"learning_rate": 7.056975972680517e-05,
"loss": 0.3781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39214226603507996,
"step": 935,
"valid_targets_mean": 3744.8,
"valid_targets_min": 1098
},
{
"epoch": 2.965299684542587,
"grad_norm": 0.3355639560460545,
"learning_rate": 7.028563055290044e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3316793441772461,
"step": 940,
"valid_targets_mean": 4230.8,
"valid_targets_min": 1001
},
{
"epoch": 2.9810725552050474,
"grad_norm": 0.32982130499991974,
"learning_rate": 7.000071507159744e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32892876863479614,
"step": 945,
"valid_targets_mean": 4000.3,
"valid_targets_min": 1092
},
{
"epoch": 2.996845425867508,
"grad_norm": 0.34264280670103553,
"learning_rate": 6.971502432673085e-05,
"loss": 0.3437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32262521982192993,
"step": 950,
"valid_targets_mean": 3800.8,
"valid_targets_min": 1199
},
{
"epoch": 3.0126182965299684,
"grad_norm": 0.7097009281353539,
"learning_rate": 6.942856939218599e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25441882014274597,
"step": 955,
"valid_targets_mean": 3380.2,
"valid_targets_min": 937
},
{
"epoch": 3.028391167192429,
"grad_norm": 0.4141083590950299,
"learning_rate": 6.914136137146951e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23335978388786316,
"step": 960,
"valid_targets_mean": 4133.7,
"valid_targets_min": 744
},
{
"epoch": 3.0441640378548898,
"grad_norm": 0.46856537273414334,
"learning_rate": 6.885341139727912e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24540895223617554,
"step": 965,
"valid_targets_mean": 3925.4,
"valid_targets_min": 984
},
{
"epoch": 3.0599369085173502,
"grad_norm": 0.4418748358978105,
"learning_rate": 6.856473063107187e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26762479543685913,
"step": 970,
"valid_targets_mean": 3725.4,
"valid_targets_min": 728
},
{
"epoch": 3.0757097791798107,
"grad_norm": 0.43206699700017354,
"learning_rate": 6.827533026263169e-05,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2583632469177246,
"step": 975,
"valid_targets_mean": 3629.8,
"valid_targets_min": 934
},
{
"epoch": 3.091482649842271,
"grad_norm": 0.3617975005945939,
"learning_rate": 6.798522150963552e-05,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22357064485549927,
"step": 980,
"valid_targets_mean": 4364.8,
"valid_targets_min": 658
},
{
"epoch": 3.107255520504732,
"grad_norm": 0.38710853094314396,
"learning_rate": 6.769441561721863e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2311776876449585,
"step": 985,
"valid_targets_mean": 4206.0,
"valid_targets_min": 752
},
{
"epoch": 3.1230283911671926,
"grad_norm": 0.38654625221316713,
"learning_rate": 6.740292385753858e-05,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2150537222623825,
"step": 990,
"valid_targets_mean": 3844.5,
"valid_targets_min": 737
},
{
"epoch": 3.138801261829653,
"grad_norm": 0.6526308811071234,
"learning_rate": 6.711075752933847e-05,
"loss": 0.2383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2665025591850281,
"step": 995,
"valid_targets_mean": 3494.9,
"valid_targets_min": 1070
},
{
"epoch": 3.1545741324921135,
"grad_norm": 0.4166111698553452,
"learning_rate": 6.681792795750875e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24555368721485138,
"step": 1000,
"valid_targets_mean": 4494.4,
"valid_targets_min": 1261
},
{
"epoch": 3.170347003154574,
"grad_norm": 0.3792621220742212,
"learning_rate": 6.652444649264856e-05,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24369245767593384,
"step": 1005,
"valid_targets_mean": 4548.4,
"valid_targets_min": 1186
},
{
"epoch": 3.186119873817035,
"grad_norm": 0.45428146737608754,
"learning_rate": 6.623032451062542e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21560588479042053,
"step": 1010,
"valid_targets_mean": 2806.8,
"valid_targets_min": 700
},
{
"epoch": 3.2018927444794953,
"grad_norm": 0.4396918249543382,
"learning_rate": 6.593557341213457e-05,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22254452109336853,
"step": 1015,
"valid_targets_mean": 2975.2,
"valid_targets_min": 671
},
{
"epoch": 3.217665615141956,
"grad_norm": 0.42749423096915035,
"learning_rate": 6.564020462225679e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2484319508075714,
"step": 1020,
"valid_targets_mean": 3568.7,
"valid_targets_min": 843
},
{
"epoch": 3.2334384858044163,
"grad_norm": 0.39159517401747657,
"learning_rate": 6.534422959001585e-05,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22285829484462738,
"step": 1025,
"valid_targets_mean": 3964.2,
"valid_targets_min": 1164
},
{
"epoch": 3.249211356466877,
"grad_norm": 0.4291962426431375,
"learning_rate": 6.504765978793443e-05,
"loss": 0.2355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27856796979904175,
"step": 1030,
"valid_targets_mean": 4023.6,
"valid_targets_min": 1201
},
{
"epoch": 3.2649842271293377,
"grad_norm": 0.4450053564657277,
"learning_rate": 6.475050671158961e-05,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21933044493198395,
"step": 1035,
"valid_targets_mean": 3322.5,
"valid_targets_min": 865
},
{
"epoch": 3.280757097791798,
"grad_norm": 0.43034585118259266,
"learning_rate": 6.445278187916722e-05,
"loss": 0.2355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2606717050075531,
"step": 1040,
"valid_targets_mean": 3505.2,
"valid_targets_min": 746
},
{
"epoch": 3.2965299684542586,
"grad_norm": 0.37410333228585696,
"learning_rate": 6.415449683101537e-05,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2275415062904358,
"step": 1045,
"valid_targets_mean": 4542.5,
"valid_targets_min": 1215
},
{
"epoch": 3.312302839116719,
"grad_norm": 0.40963729012232886,
"learning_rate": 6.385566312919716e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20051081478595734,
"step": 1050,
"valid_targets_mean": 3469.5,
"valid_targets_min": 779
},
{
"epoch": 3.32807570977918,
"grad_norm": 0.4396800514108122,
"learning_rate": 6.355629235704248e-05,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2249513864517212,
"step": 1055,
"valid_targets_mean": 3372.2,
"valid_targets_min": 889
},
{
"epoch": 3.3438485804416405,
"grad_norm": 0.3906571239789868,
"learning_rate": 6.3256396118699e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2390715628862381,
"step": 1060,
"valid_targets_mean": 4076.8,
"valid_targets_min": 700
},
{
"epoch": 3.359621451104101,
"grad_norm": 0.4207281200709271,
"learning_rate": 6.295598603868246e-05,
"loss": 0.2302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26639336347579956,
"step": 1065,
"valid_targets_mean": 4140.6,
"valid_targets_min": 991
},
{
"epoch": 3.3753943217665614,
"grad_norm": 0.41411028120988236,
"learning_rate": 6.265507376142594e-05,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24677228927612305,
"step": 1070,
"valid_targets_mean": 3294.0,
"valid_targets_min": 1005
},
{
"epoch": 3.3911671924290223,
"grad_norm": 0.4574462947352491,
"learning_rate": 6.235367095082867e-05,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24753236770629883,
"step": 1075,
"valid_targets_mean": 3098.3,
"valid_targets_min": 883
},
{
"epoch": 3.406940063091483,
"grad_norm": 0.44568583062116435,
"learning_rate": 6.205178928980377e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23697753250598907,
"step": 1080,
"valid_targets_mean": 3348.2,
"valid_targets_min": 676
},
{
"epoch": 3.4227129337539433,
"grad_norm": 0.40272251602889164,
"learning_rate": 6.174944047982549e-05,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23433184623718262,
"step": 1085,
"valid_targets_mean": 3644.0,
"valid_targets_min": 1339
},
{
"epoch": 3.4384858044164037,
"grad_norm": 0.43918368499686794,
"learning_rate": 6.144663624047564e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24812614917755127,
"step": 1090,
"valid_targets_mean": 3482.3,
"valid_targets_min": 749
},
{
"epoch": 3.454258675078864,
"grad_norm": 0.4228096716595015,
"learning_rate": 6.114338830898922e-05,
"loss": 0.2466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24244436621665955,
"step": 1095,
"valid_targets_mean": 3178.1,
"valid_targets_min": 825
},
{
"epoch": 3.470031545741325,
"grad_norm": 0.39163077627657583,
"learning_rate": 6.083970843979957e-05,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23379601538181305,
"step": 1100,
"valid_targets_mean": 3980.8,
"valid_targets_min": 494
},
{
"epoch": 3.4858044164037856,
"grad_norm": 0.4328683495707631,
"learning_rate": 6.0535608404082724e-05,
"loss": 0.2527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2863377332687378,
"step": 1105,
"valid_targets_mean": 3707.3,
"valid_targets_min": 619
},
{
"epoch": 3.501577287066246,
"grad_norm": 0.4102684667021291,
"learning_rate": 6.0231099989301086e-05,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2362220287322998,
"step": 1110,
"valid_targets_mean": 3817.2,
"valid_targets_min": 421
},
{
"epoch": 3.5173501577287065,
"grad_norm": 0.4640832182484784,
"learning_rate": 5.9926194998746624e-05,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24722759425640106,
"step": 1115,
"valid_targets_mean": 2821.9,
"valid_targets_min": 701
},
{
"epoch": 3.5331230283911674,
"grad_norm": 0.4214315372040873,
"learning_rate": 5.9620905251083196e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25116032361984253,
"step": 1120,
"valid_targets_mean": 4028.2,
"valid_targets_min": 1224
},
{
"epoch": 3.548895899053628,
"grad_norm": 0.4050858811434479,
"learning_rate": 5.931524257988864e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2557201087474823,
"step": 1125,
"valid_targets_mean": 3980.5,
"valid_targets_min": 762
},
{
"epoch": 3.5646687697160884,
"grad_norm": 0.406660075884935,
"learning_rate": 5.900921883319591e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23852787911891937,
"step": 1130,
"valid_targets_mean": 4305.7,
"valid_targets_min": 702
},
{
"epoch": 3.580441640378549,
"grad_norm": 0.38441971141571263,
"learning_rate": 5.870284587303394e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21825431287288666,
"step": 1135,
"valid_targets_mean": 3953.8,
"valid_targets_min": 1109
},
{
"epoch": 3.5962145110410093,
"grad_norm": 0.43559756325600296,
"learning_rate": 5.839613557496776e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2443239539861679,
"step": 1140,
"valid_targets_mean": 3330.1,
"valid_targets_min": 742
},
{
"epoch": 3.61198738170347,
"grad_norm": 0.4144684042912617,
"learning_rate": 5.808909982763825e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2617552876472473,
"step": 1145,
"valid_targets_mean": 3567.0,
"valid_targets_min": 676
},
{
"epoch": 3.6277602523659307,
"grad_norm": 0.41419953192389397,
"learning_rate": 5.778175053230126e-05,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2499631643295288,
"step": 1150,
"valid_targets_mean": 3682.4,
"valid_targets_min": 592
},
{
"epoch": 3.643533123028391,
"grad_norm": 0.4248863441860044,
"learning_rate": 5.747409960236637e-05,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2362518310546875,
"step": 1155,
"valid_targets_mean": 3552.7,
"valid_targets_min": 840
},
{
"epoch": 3.6593059936908516,
"grad_norm": 0.4077084205643721,
"learning_rate": 5.716615896293501e-05,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23393303155899048,
"step": 1160,
"valid_targets_mean": 3526.3,
"valid_targets_min": 753
},
{
"epoch": 3.6750788643533125,
"grad_norm": 0.42649978051773413,
"learning_rate": 5.68579405503383e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21634435653686523,
"step": 1165,
"valid_targets_mean": 3465.7,
"valid_targets_min": 319
},
{
"epoch": 3.690851735015773,
"grad_norm": 0.40336913679264713,
"learning_rate": 5.654945631167433e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26242315769195557,
"step": 1170,
"valid_targets_mean": 4229.9,
"valid_targets_min": 1083
},
{
"epoch": 3.7066246056782335,
"grad_norm": 0.3665963077273498,
"learning_rate": 5.624071820434508e-05,
"loss": 0.2285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2064288854598999,
"step": 1175,
"valid_targets_mean": 4215.2,
"valid_targets_min": 1362
},
{
"epoch": 3.722397476340694,
"grad_norm": 0.3999997884440537,
"learning_rate": 5.593173819559294e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22290341556072235,
"step": 1180,
"valid_targets_mean": 3652.1,
"valid_targets_min": 635
},
{
"epoch": 3.7381703470031544,
"grad_norm": 0.3557096871710355,
"learning_rate": 5.562252826203687e-05,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22109612822532654,
"step": 1185,
"valid_targets_mean": 4395.5,
"valid_targets_min": 513
},
{
"epoch": 3.753943217665615,
"grad_norm": 0.431122095793743,
"learning_rate": 5.531310038920805e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2331051081418991,
"step": 1190,
"valid_targets_mean": 3222.1,
"valid_targets_min": 1243
},
{
"epoch": 3.769716088328076,
"grad_norm": 0.3880204576004606,
"learning_rate": 5.500346657108545e-05,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2325371503829956,
"step": 1195,
"valid_targets_mean": 3813.5,
"valid_targets_min": 925
},
{
"epoch": 3.7854889589905363,
"grad_norm": 0.44598651479849705,
"learning_rate": 5.469363880963082e-05,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24427175521850586,
"step": 1200,
"valid_targets_mean": 3289.9,
"valid_targets_min": 751
},
{
"epoch": 3.8012618296529967,
"grad_norm": 0.3931285059362459,
"learning_rate": 5.438362911432347e-05,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2518792152404785,
"step": 1205,
"valid_targets_mean": 4406.3,
"valid_targets_min": 1046
},
{
"epoch": 3.8170347003154577,
"grad_norm": 0.4035669817262566,
"learning_rate": 5.407344950169486e-05,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2715667188167572,
"step": 1210,
"valid_targets_mean": 4231.5,
"valid_targets_min": 941
},
{
"epoch": 3.832807570977918,
"grad_norm": 0.3957915259954298,
"learning_rate": 5.376311199486268e-05,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23946471512317657,
"step": 1215,
"valid_targets_mean": 3859.7,
"valid_targets_min": 734
},
{
"epoch": 3.8485804416403786,
"grad_norm": 0.383172680689461,
"learning_rate": 5.3452628623064934e-05,
"loss": 0.2358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22085560858249664,
"step": 1220,
"valid_targets_mean": 3614.2,
"valid_targets_min": 955
},
{
"epoch": 3.864353312302839,
"grad_norm": 0.36385693259713353,
"learning_rate": 5.31420114211936e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2752317488193512,
"step": 1225,
"valid_targets_mean": 4839.8,
"valid_targets_min": 1679
},
{
"epoch": 3.8801261829652995,
"grad_norm": 0.370531037509034,
"learning_rate": 5.2831272429328116e-05,
"loss": 0.2411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20723074674606323,
"step": 1230,
"valid_targets_mean": 3841.6,
"valid_targets_min": 238
},
{
"epoch": 3.89589905362776,
"grad_norm": 0.4465487481114569,
"learning_rate": 5.2520423692268775e-05,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2362392246723175,
"step": 1235,
"valid_targets_mean": 2908.7,
"valid_targets_min": 759
},
{
"epoch": 3.911671924290221,
"grad_norm": 0.40183616151013524,
"learning_rate": 5.220947725906975e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23403562605381012,
"step": 1240,
"valid_targets_mean": 4062.1,
"valid_targets_min": 794
},
{
"epoch": 3.9274447949526814,
"grad_norm": 0.36720727944432746,
"learning_rate": 5.18984451825721e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2156575322151184,
"step": 1245,
"valid_targets_mean": 4244.2,
"valid_targets_min": 1346
},
{
"epoch": 3.943217665615142,
"grad_norm": 0.36739318896142137,
"learning_rate": 5.1587339518936585e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23408517241477966,
"step": 1250,
"valid_targets_mean": 4298.3,
"valid_targets_min": 751
},
{
"epoch": 3.958990536277603,
"grad_norm": 0.38433498745772443,
"learning_rate": 5.127617232717631e-05,
"loss": 0.2435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26561039686203003,
"step": 1255,
"valid_targets_mean": 4233.7,
"valid_targets_min": 780
},
{
"epoch": 3.9747634069400632,
"grad_norm": 0.417328324144264,
"learning_rate": 5.096495566868935e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26622718572616577,
"step": 1260,
"valid_targets_mean": 3380.5,
"valid_targets_min": 1257
},
{
"epoch": 3.9905362776025237,
"grad_norm": 0.40583456982881966,
"learning_rate": 5.065370160679115e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2431681752204895,
"step": 1265,
"valid_targets_mean": 3864.8,
"valid_targets_min": 899
},
{
"epoch": 4.006309148264984,
"grad_norm": 0.4821387411125082,
"learning_rate": 5.034242220624706e-05,
"loss": 0.2013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15413779020309448,
"step": 1270,
"valid_targets_mean": 3352.2,
"valid_targets_min": 830
},
{
"epoch": 4.022082018927445,
"grad_norm": 0.5507076000324466,
"learning_rate": 5.003112953280452e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13071414828300476,
"step": 1275,
"valid_targets_mean": 3422.1,
"valid_targets_min": 869
},
{
"epoch": 4.037854889589905,
"grad_norm": 0.4613969580120687,
"learning_rate": 4.971983565272553e-05,
"loss": 0.1438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12674719095230103,
"step": 1280,
"valid_targets_mean": 2750.3,
"valid_targets_min": 994
},
{
"epoch": 4.053627760252366,
"grad_norm": 0.4152583203563749,
"learning_rate": 4.940855263231873e-05,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1208362877368927,
"step": 1285,
"valid_targets_mean": 3728.6,
"valid_targets_min": 961
},
{
"epoch": 4.069400630914826,
"grad_norm": 0.4482984088898629,
"learning_rate": 4.909729253747197e-05,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1652022749185562,
"step": 1290,
"valid_targets_mean": 3619.0,
"valid_targets_min": 1439
},
{
"epoch": 4.085173501577287,
"grad_norm": 0.399726958950638,
"learning_rate": 4.878606743318439e-05,
"loss": 0.1425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11733722686767578,
"step": 1295,
"valid_targets_mean": 3720.7,
"valid_targets_min": 980
},
{
"epoch": 4.100946372239748,
"grad_norm": 0.46687530262082305,
"learning_rate": 4.8474889383098855e-05,
"loss": 0.1452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1552787721157074,
"step": 1300,
"valid_targets_mean": 3531.9,
"valid_targets_min": 549
},
{
"epoch": 4.116719242902208,
"grad_norm": 0.4162751106492577,
"learning_rate": 4.816377044903428e-05,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12626974284648895,
"step": 1305,
"valid_targets_mean": 4288.3,
"valid_targets_min": 1040
},
{
"epoch": 4.132492113564669,
"grad_norm": 0.49835621727107526,
"learning_rate": 4.7852722690518196e-05,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440780758857727,
"step": 1310,
"valid_targets_mean": 2622.8,
"valid_targets_min": 715
},
{
"epoch": 4.148264984227129,
"grad_norm": 0.43297110173064957,
"learning_rate": 4.75417581643192e-05,
"loss": 0.1389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14077317714691162,
"step": 1315,
"valid_targets_mean": 3629.1,
"valid_targets_min": 809
},
{
"epoch": 4.16403785488959,
"grad_norm": 0.4263831486425033,
"learning_rate": 4.723088892397968e-05,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13717670738697052,
"step": 1320,
"valid_targets_mean": 3560.4,
"valid_targets_min": 762
},
{
"epoch": 4.17981072555205,
"grad_norm": 0.40962122241683374,
"learning_rate": 4.6920127019348556e-05,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14324375987052917,
"step": 1325,
"valid_targets_mean": 4316.1,
"valid_targets_min": 1018
},
{
"epoch": 4.195583596214511,
"grad_norm": 0.39674021617148886,
"learning_rate": 4.6609484496114256e-05,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13059474527835846,
"step": 1330,
"valid_targets_mean": 4042.8,
"valid_targets_min": 356
},
{
"epoch": 4.211356466876971,
"grad_norm": 0.42194240284178985,
"learning_rate": 4.629897339533771e-05,
"loss": 0.1371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11975990235805511,
"step": 1335,
"valid_targets_mean": 3509.7,
"valid_targets_min": 622
},
{
"epoch": 4.2271293375394325,
"grad_norm": 0.4348331012114048,
"learning_rate": 4.598860575298575e-05,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14041069149971008,
"step": 1340,
"valid_targets_mean": 3980.3,
"valid_targets_min": 952
},
{
"epoch": 4.242902208201893,
"grad_norm": 0.47949363282852,
"learning_rate": 4.5678393599464435e-05,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18775832653045654,
"step": 1345,
"valid_targets_mean": 3573.2,
"valid_targets_min": 650
},
{
"epoch": 4.2586750788643535,
"grad_norm": 0.42941461444596235,
"learning_rate": 4.5368348959152864e-05,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13734444975852966,
"step": 1350,
"valid_targets_mean": 3916.9,
"valid_targets_min": 756
},
{
"epoch": 4.274447949526814,
"grad_norm": 0.4550660502056618,
"learning_rate": 4.505848384993696e-05,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1418776959180832,
"step": 1355,
"valid_targets_mean": 3606.0,
"valid_targets_min": 815
},
{
"epoch": 4.290220820189274,
"grad_norm": 0.4330817089869141,
"learning_rate": 4.474881028274375e-05,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1301407814025879,
"step": 1360,
"valid_targets_mean": 3551.2,
"valid_targets_min": 782
},
{
"epoch": 4.305993690851735,
"grad_norm": 0.414328135805903,
"learning_rate": 4.4439340261075716e-05,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14358800649642944,
"step": 1365,
"valid_targets_mean": 3952.6,
"valid_targets_min": 1010
},
{
"epoch": 4.321766561514195,
"grad_norm": 0.3935072929678093,
"learning_rate": 4.413008578054558e-05,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1338864117860794,
"step": 1370,
"valid_targets_mean": 4548.4,
"valid_targets_min": 1340
},
{
"epoch": 4.337539432176656,
"grad_norm": 0.43902808024930545,
"learning_rate": 4.3821058828411244e-05,
"loss": 0.1408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14350779354572296,
"step": 1375,
"valid_targets_mean": 3322.0,
"valid_targets_min": 1092
},
{
"epoch": 4.353312302839116,
"grad_norm": 0.47832433617177983,
"learning_rate": 4.35122713831113e-05,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16027812659740448,
"step": 1380,
"valid_targets_mean": 3451.2,
"valid_targets_min": 654
},
{
"epoch": 4.369085173501578,
"grad_norm": 0.3780995897403291,
"learning_rate": 4.320373541380054e-05,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1329713761806488,
"step": 1385,
"valid_targets_mean": 4768.9,
"valid_targets_min": 374
},
{
"epoch": 4.384858044164038,
"grad_norm": 0.41367517391687664,
"learning_rate": 4.289546287988614e-05,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14861229062080383,
"step": 1390,
"valid_targets_mean": 4518.6,
"valid_targets_min": 1142
},
{
"epoch": 4.400630914826499,
"grad_norm": 0.38660135861653716,
"learning_rate": 4.258746573056401e-05,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13534846901893616,
"step": 1395,
"valid_targets_mean": 4576.8,
"valid_targets_min": 1064
},
{
"epoch": 4.416403785488959,
"grad_norm": 0.43614094592909824,
"learning_rate": 4.2279755904355704e-05,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16031000018119812,
"step": 1400,
"valid_targets_mean": 4019.5,
"valid_targets_min": 765
},
{
"epoch": 4.4321766561514195,
"grad_norm": 0.4121639292417491,
"learning_rate": 4.197234532864558e-05,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1366066038608551,
"step": 1405,
"valid_targets_mean": 3927.2,
"valid_targets_min": 789
},
{
"epoch": 4.44794952681388,
"grad_norm": 0.46001162500530945,
"learning_rate": 4.1665245919218544e-05,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16069738566875458,
"step": 1410,
"valid_targets_mean": 3374.1,
"valid_targets_min": 1130
},
{
"epoch": 4.4637223974763405,
"grad_norm": 0.4415524300689523,
"learning_rate": 4.135846957979811e-05,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14812339842319489,
"step": 1415,
"valid_targets_mean": 3858.5,
"valid_targets_min": 976
},
{
"epoch": 4.479495268138801,
"grad_norm": 0.41572746327510646,
"learning_rate": 4.105202820158503e-05,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14529840648174286,
"step": 1420,
"valid_targets_mean": 4642.3,
"valid_targets_min": 1302
},
{
"epoch": 4.495268138801261,
"grad_norm": 0.40567170422574816,
"learning_rate": 4.074593366279636e-05,
"loss": 0.1347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11761084198951721,
"step": 1425,
"valid_targets_mean": 3919.9,
"valid_targets_min": 841
},
{
"epoch": 4.511041009463723,
"grad_norm": 0.43551327648741345,
"learning_rate": 4.044019782820505e-05,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16616562008857727,
"step": 1430,
"valid_targets_mean": 3753.2,
"valid_targets_min": 899
},
{
"epoch": 4.526813880126183,
"grad_norm": 0.4304253714649899,
"learning_rate": 4.0134832548680006e-05,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14028897881507874,
"step": 1435,
"valid_targets_mean": 3892.4,
"valid_targets_min": 981
},
{
"epoch": 4.542586750788644,
"grad_norm": 0.4300902798658754,
"learning_rate": 3.982984966072677e-05,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14914816617965698,
"step": 1440,
"valid_targets_mean": 3653.2,
"valid_targets_min": 982
},
{
"epoch": 4.558359621451104,
"grad_norm": 0.4657374621310647,
"learning_rate": 3.952526098602873e-05,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14326679706573486,
"step": 1445,
"valid_targets_mean": 3503.7,
"valid_targets_min": 1060
},
{
"epoch": 4.574132492113565,
"grad_norm": 0.43365046360826953,
"learning_rate": 3.9221078330988806e-05,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13995081186294556,
"step": 1450,
"valid_targets_mean": 3612.9,
"valid_targets_min": 1266
},
{
"epoch": 4.589905362776025,
"grad_norm": 0.4727320068947522,
"learning_rate": 3.89173134862719e-05,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1454961597919464,
"step": 1455,
"valid_targets_mean": 3642.2,
"valid_targets_min": 582
},
{
"epoch": 4.605678233438486,
"grad_norm": 0.4414031361451162,
"learning_rate": 3.861397822634784e-05,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15584497153759003,
"step": 1460,
"valid_targets_mean": 3764.9,
"valid_targets_min": 1082
},
{
"epoch": 4.621451104100946,
"grad_norm": 0.41187705436552824,
"learning_rate": 3.831108430903494e-05,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14060024917125702,
"step": 1465,
"valid_targets_mean": 4490.7,
"valid_targets_min": 790
},
{
"epoch": 4.6372239747634065,
"grad_norm": 0.43315410457939646,
"learning_rate": 3.800864347504437e-05,
"loss": 0.1513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14828018844127655,
"step": 1470,
"valid_targets_mean": 3756.7,
"valid_targets_min": 895
},
{
"epoch": 4.652996845425868,
"grad_norm": 0.4315038585680116,
"learning_rate": 3.7706667447524876e-05,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16025035083293915,
"step": 1475,
"valid_targets_mean": 3776.8,
"valid_targets_min": 757
},
{
"epoch": 4.668769716088328,
"grad_norm": 0.4629700901684569,
"learning_rate": 3.740516793160855e-05,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1619722992181778,
"step": 1480,
"valid_targets_mean": 3953.1,
"valid_targets_min": 1047
},
{
"epoch": 4.684542586750789,
"grad_norm": 0.4506448009518266,
"learning_rate": 3.710415661395699e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1594841182231903,
"step": 1485,
"valid_targets_mean": 3689.6,
"valid_targets_min": 604
},
{
"epoch": 4.700315457413249,
"grad_norm": 0.4595891610524585,
"learning_rate": 3.6803645162308376e-05,
"loss": 0.1495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17818719148635864,
"step": 1490,
"valid_targets_mean": 3929.1,
"valid_targets_min": 940
},
{
"epoch": 4.71608832807571,
"grad_norm": 0.4150467966875533,
"learning_rate": 3.6503645225025175e-05,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16535528004169464,
"step": 1495,
"valid_targets_mean": 4194.8,
"valid_targets_min": 791
},
{
"epoch": 4.73186119873817,
"grad_norm": 0.4061399055435858,
"learning_rate": 3.620416843064266e-05,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13359515368938446,
"step": 1500,
"valid_targets_mean": 4139.6,
"valid_targets_min": 676
},
{
"epoch": 4.747634069400631,
"grad_norm": 0.4132881612276861,
"learning_rate": 3.5905226387418126e-05,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1458536684513092,
"step": 1505,
"valid_targets_mean": 3785.9,
"valid_targets_min": 648
},
{
"epoch": 4.763406940063091,
"grad_norm": 0.4882855781127496,
"learning_rate": 3.5606830682880965e-05,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18403048813343048,
"step": 1510,
"valid_targets_mean": 3238.6,
"valid_targets_min": 700
},
{
"epoch": 4.779179810725552,
"grad_norm": 0.48302912366147344,
"learning_rate": 3.530899288338352e-05,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15412986278533936,
"step": 1515,
"valid_targets_mean": 3244.3,
"valid_targets_min": 693
},
{
"epoch": 4.794952681388013,
"grad_norm": 0.41004786154940126,
"learning_rate": 3.501172453365268e-05,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13483601808547974,
"step": 1520,
"valid_targets_mean": 4170.5,
"valid_targets_min": 1177
},
{
"epoch": 4.8107255520504735,
"grad_norm": 0.4225330709889332,
"learning_rate": 3.471503715634252e-05,
"loss": 0.1403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14184939861297607,
"step": 1525,
"valid_targets_mean": 3843.4,
"valid_targets_min": 731
},
{
"epoch": 4.826498422712934,
"grad_norm": 0.37596497087636227,
"learning_rate": 3.44189422515875e-05,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15294434130191803,
"step": 1530,
"valid_targets_mean": 4488.2,
"valid_targets_min": 801
},
{
"epoch": 4.842271293375394,
"grad_norm": 0.38087264895160944,
"learning_rate": 3.4123451296556845e-05,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13751477003097534,
"step": 1535,
"valid_targets_mean": 4411.7,
"valid_targets_min": 337
},
{
"epoch": 4.858044164037855,
"grad_norm": 0.39361476642320653,
"learning_rate": 3.382857574500957e-05,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13432013988494873,
"step": 1540,
"valid_targets_mean": 4315.6,
"valid_targets_min": 1197
},
{
"epoch": 4.873817034700315,
"grad_norm": 0.42718530839186636,
"learning_rate": 3.3534327026850574e-05,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16855821013450623,
"step": 1545,
"valid_targets_mean": 4262.7,
"valid_targets_min": 635
},
{
"epoch": 4.889589905362776,
"grad_norm": 0.3917349041475647,
"learning_rate": 3.324071654768754e-05,
"loss": 0.1333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1179637610912323,
"step": 1550,
"valid_targets_mean": 3897.3,
"valid_targets_min": 730
},
{
"epoch": 4.905362776025236,
"grad_norm": 0.4466560221892044,
"learning_rate": 3.2947755688388874e-05,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13815364241600037,
"step": 1555,
"valid_targets_mean": 3516.4,
"valid_targets_min": 641
},
{
"epoch": 4.921135646687697,
"grad_norm": 0.4240920687523467,
"learning_rate": 3.26554558046426e-05,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13758045434951782,
"step": 1560,
"valid_targets_mean": 4800.1,
"valid_targets_min": 666
},
{
"epoch": 4.936908517350158,
"grad_norm": 0.39942977491928344,
"learning_rate": 3.236382822651606e-05,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12246360629796982,
"step": 1565,
"valid_targets_mean": 3751.0,
"valid_targets_min": 380
},
{
"epoch": 4.952681388012619,
"grad_norm": 0.40923515884045225,
"learning_rate": 3.207288425801689e-05,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13511720299720764,
"step": 1570,
"valid_targets_mean": 4188.2,
"valid_targets_min": 1496
},
{
"epoch": 4.968454258675079,
"grad_norm": 0.47290889467879393,
"learning_rate": 3.1782635176654764e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17075365781784058,
"step": 1575,
"valid_targets_mean": 3425.8,
"valid_targets_min": 747
},
{
"epoch": 4.9842271293375395,
"grad_norm": 0.44727850590756046,
"learning_rate": 3.149309223300428e-05,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16327592730522156,
"step": 1580,
"valid_targets_mean": 3940.4,
"valid_targets_min": 1439
},
{
"epoch": 5.0,
"grad_norm": 0.4095300324275936,
"learning_rate": 3.120426665026891e-05,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14301863312721252,
"step": 1585,
"valid_targets_mean": 3949.0,
"valid_targets_min": 776
},
{
"epoch": 5.0157728706624605,
"grad_norm": 0.4965073217628422,
"learning_rate": 3.091616962384587e-05,
"loss": 0.0813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06953192502260208,
"step": 1590,
"valid_targets_mean": 3511.0,
"valid_targets_min": 421
},
{
"epoch": 5.031545741324921,
"grad_norm": 0.39829247464224404,
"learning_rate": 3.06288123208923e-05,
"loss": 0.0813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07943619787693024,
"step": 1595,
"valid_targets_mean": 3653.5,
"valid_targets_min": 790
},
{
"epoch": 5.047318611987381,
"grad_norm": 0.36709273418268795,
"learning_rate": 3.034220587989226e-05,
"loss": 0.0785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0734889879822731,
"step": 1600,
"valid_targets_mean": 4551.4,
"valid_targets_min": 757
},
{
"epoch": 5.063091482649842,
"grad_norm": 0.46061848051569354,
"learning_rate": 3.005636141022512e-05,
"loss": 0.0806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09356047958135605,
"step": 1605,
"valid_targets_mean": 4240.9,
"valid_targets_min": 1133
},
{
"epoch": 5.078864353312303,
"grad_norm": 0.3863919471144128,
"learning_rate": 2.977128999173482e-05,
"loss": 0.0793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07880861312150955,
"step": 1610,
"valid_targets_mean": 4272.3,
"valid_targets_min": 961
},
{
"epoch": 5.094637223974764,
"grad_norm": 0.4006873478397203,
"learning_rate": 2.948700267430049e-05,
"loss": 0.0754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07071110606193542,
"step": 1615,
"valid_targets_mean": 3531.6,
"valid_targets_min": 676
},
{
"epoch": 5.110410094637224,
"grad_norm": 0.35708727468781015,
"learning_rate": 2.920351047740808e-05,
"loss": 0.0773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07418598234653473,
"step": 1620,
"valid_targets_mean": 4278.7,
"valid_targets_min": 909
},
{
"epoch": 5.126182965299685,
"grad_norm": 0.36066950208005905,
"learning_rate": 2.892082438972325e-05,
"loss": 0.0854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07705340534448624,
"step": 1625,
"valid_targets_mean": 4657.5,
"valid_targets_min": 1511
},
{
"epoch": 5.141955835962145,
"grad_norm": 0.3755353448825496,
"learning_rate": 2.863895536866541e-05,
"loss": 0.0779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0808149129152298,
"step": 1630,
"valid_targets_mean": 4137.3,
"valid_targets_min": 951
},
{
"epoch": 5.157728706624606,
"grad_norm": 0.38944321711541496,
"learning_rate": 2.835791433998301e-05,
"loss": 0.084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07152563333511353,
"step": 1635,
"valid_targets_mean": 3748.3,
"valid_targets_min": 714
},
{
"epoch": 5.173501577287066,
"grad_norm": 0.3859159269519384,
"learning_rate": 2.807771219733004e-05,
"loss": 0.0783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07155505567789078,
"step": 1640,
"valid_targets_mean": 4150.2,
"valid_targets_min": 1198
},
{
"epoch": 5.1892744479495265,
"grad_norm": 0.40877023575458493,
"learning_rate": 2.7798359801843766e-05,
"loss": 0.0764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07761353999376297,
"step": 1645,
"valid_targets_mean": 3865.1,
"valid_targets_min": 1006
},
{
"epoch": 5.205047318611987,
"grad_norm": 0.4307421685519268,
"learning_rate": 2.7519867981723712e-05,
"loss": 0.0811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0829286277294159,
"step": 1650,
"valid_targets_mean": 3674.1,
"valid_targets_min": 875
},
{
"epoch": 5.220820189274448,
"grad_norm": 0.3970534191384527,
"learning_rate": 2.724224753181197e-05,
"loss": 0.081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09701694548130035,
"step": 1655,
"valid_targets_mean": 3567.1,
"valid_targets_min": 850
},
{
"epoch": 5.236593059936909,
"grad_norm": 0.34934506488749156,
"learning_rate": 2.6965509213174777e-05,
"loss": 0.0758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06851125508546829,
"step": 1660,
"valid_targets_mean": 4961.3,
"valid_targets_min": 1014
},
{
"epoch": 5.252365930599369,
"grad_norm": 0.39059286750879313,
"learning_rate": 2.6689663752685334e-05,
"loss": 0.0791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07081689685583115,
"step": 1665,
"valid_targets_mean": 3873.0,
"valid_targets_min": 442
},
{
"epoch": 5.26813880126183,
"grad_norm": 0.4374595810187239,
"learning_rate": 2.641472184260809e-05,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0809621810913086,
"step": 1670,
"valid_targets_mean": 3478.6,
"valid_targets_min": 1393
},
{
"epoch": 5.28391167192429,
"grad_norm": 0.42133117621400595,
"learning_rate": 2.614069414018428e-05,
"loss": 0.0758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08253119140863419,
"step": 1675,
"valid_targets_mean": 3928.3,
"valid_targets_min": 814
},
{
"epoch": 5.299684542586751,
"grad_norm": 0.4013385383890111,
"learning_rate": 2.5867591267218805e-05,
"loss": 0.0818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08884066343307495,
"step": 1680,
"valid_targets_mean": 4909.7,
"valid_targets_min": 1545
},
{
"epoch": 5.315457413249211,
"grad_norm": 0.39344189247215844,
"learning_rate": 2.5595423809668452e-05,
"loss": 0.076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07590728253126144,
"step": 1685,
"valid_targets_mean": 4204.9,
"valid_targets_min": 875
},
{
"epoch": 5.331230283911672,
"grad_norm": 0.3542083009513637,
"learning_rate": 2.532420231723172e-05,
"loss": 0.078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06620984524488449,
"step": 1690,
"valid_targets_mean": 5040.6,
"valid_targets_min": 952
},
{
"epoch": 5.347003154574132,
"grad_norm": 0.3955609190369812,
"learning_rate": 2.5053937302939767e-05,
"loss": 0.0831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07462330162525177,
"step": 1695,
"valid_targets_mean": 3349.1,
"valid_targets_min": 797
},
{
"epoch": 5.3627760252365935,
"grad_norm": 0.40977897760118465,
"learning_rate": 2.4784639242748953e-05,
"loss": 0.0824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0794137567281723,
"step": 1700,
"valid_targets_mean": 3732.3,
"valid_targets_min": 335
},
{
"epoch": 5.378548895899054,
"grad_norm": 0.3936043142614415,
"learning_rate": 2.451631857513472e-05,
"loss": 0.0821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0751621276140213,
"step": 1705,
"valid_targets_mean": 3926.6,
"valid_targets_min": 1082
},
{
"epoch": 5.394321766561514,
"grad_norm": 0.39725808754116887,
"learning_rate": 2.4248985700687084e-05,
"loss": 0.0891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0900493860244751,
"step": 1710,
"valid_targets_mean": 4563.2,
"valid_targets_min": 847
},
{
"epoch": 5.410094637223975,
"grad_norm": 0.38859670174776123,
"learning_rate": 2.39826509817074e-05,
"loss": 0.0751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06861039251089096,
"step": 1715,
"valid_targets_mean": 3246.6,
"valid_targets_min": 988
},
{
"epoch": 5.425867507886435,
"grad_norm": 0.3977406185047871,
"learning_rate": 2.3717324741806718e-05,
"loss": 0.0775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07713861018419266,
"step": 1720,
"valid_targets_mean": 4137.5,
"valid_targets_min": 827
},
{
"epoch": 5.441640378548896,
"grad_norm": 0.3880850246395261,
"learning_rate": 2.3453017265505673e-05,
"loss": 0.0856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07314358651638031,
"step": 1725,
"valid_targets_mean": 3994.6,
"valid_targets_min": 615
},
{
"epoch": 5.457413249211356,
"grad_norm": 0.3673248293665118,
"learning_rate": 2.3189738797835708e-05,
"loss": 0.0788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07732352614402771,
"step": 1730,
"valid_targets_mean": 4492.2,
"valid_targets_min": 814
},
{
"epoch": 5.473186119873817,
"grad_norm": 0.39818019842028823,
"learning_rate": 2.292749954394216e-05,
"loss": 0.0767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09227725863456726,
"step": 1735,
"valid_targets_mean": 4683.8,
"valid_targets_min": 973
},
{
"epoch": 5.488958990536277,
"grad_norm": 0.440987757424753,
"learning_rate": 2.266630966868852e-05,
"loss": 0.0846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10240776091814041,
"step": 1740,
"valid_targets_mean": 3867.3,
"valid_targets_min": 926
},
{
"epoch": 5.504731861198739,
"grad_norm": 0.4048674586856181,
"learning_rate": 2.2406179296262453e-05,
"loss": 0.0759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0714288204908371,
"step": 1745,
"valid_targets_mean": 3286.0,
"valid_targets_min": 811
},
{
"epoch": 5.520504731861199,
"grad_norm": 0.4145008180790608,
"learning_rate": 2.2147118509783445e-05,
"loss": 0.0821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08144058287143707,
"step": 1750,
"valid_targets_mean": 3699.2,
"valid_targets_min": 702
},
{
"epoch": 5.5362776025236595,
"grad_norm": 0.40904048276023325,
"learning_rate": 2.1889137350911894e-05,
"loss": 0.0728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08297403901815414,
"step": 1755,
"valid_targets_mean": 3566.0,
"valid_targets_min": 983
},
{
"epoch": 5.55205047318612,
"grad_norm": 0.40162391892165394,
"learning_rate": 2.1632245819459913e-05,
"loss": 0.0814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07219391316175461,
"step": 1760,
"valid_targets_mean": 4101.7,
"valid_targets_min": 658
},
{
"epoch": 5.5678233438485805,
"grad_norm": 0.3716162176336755,
"learning_rate": 2.1376453873003664e-05,
"loss": 0.0729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07064441591501236,
"step": 1765,
"valid_targets_mean": 4033.3,
"valid_targets_min": 699
},
{
"epoch": 5.583596214511041,
"grad_norm": 0.38872515423031256,
"learning_rate": 2.112177142649746e-05,
"loss": 0.0825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07718878984451294,
"step": 1770,
"valid_targets_mean": 4244.6,
"valid_targets_min": 646
},
{
"epoch": 5.599369085173501,
"grad_norm": 0.41942771920686045,
"learning_rate": 2.0868208351889402e-05,
"loss": 0.0767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08104390650987625,
"step": 1775,
"valid_targets_mean": 3666.8,
"valid_targets_min": 1210
},
{
"epoch": 5.615141955835962,
"grad_norm": 0.4011121159572857,
"learning_rate": 2.0615774477738738e-05,
"loss": 0.0829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09074635058641434,
"step": 1780,
"valid_targets_mean": 4433.3,
"valid_targets_min": 1053
},
{
"epoch": 5.630914826498422,
"grad_norm": 0.3756850116684875,
"learning_rate": 2.0364479588834835e-05,
"loss": 0.0808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07267570495605469,
"step": 1785,
"valid_targets_mean": 3606.8,
"valid_targets_min": 1072
},
{
"epoch": 5.646687697160884,
"grad_norm": 0.3809432143334385,
"learning_rate": 2.0114333425817993e-05,
"loss": 0.0884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07739441841840744,
"step": 1790,
"valid_targets_mean": 3818.2,
"valid_targets_min": 1093
},
{
"epoch": 5.662460567823344,
"grad_norm": 0.42215943694545005,
"learning_rate": 1.9865345684801846e-05,
"loss": 0.0787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08445312082767487,
"step": 1795,
"valid_targets_mean": 4031.2,
"valid_targets_min": 875
},
{
"epoch": 5.678233438485805,
"grad_norm": 0.44133345444932687,
"learning_rate": 1.9617526016997486e-05,
"loss": 0.0819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09316886961460114,
"step": 1800,
"valid_targets_mean": 3595.4,
"valid_targets_min": 827
},
{
"epoch": 5.694006309148265,
"grad_norm": 0.4028659473927513,
"learning_rate": 1.937088402833943e-05,
"loss": 0.0753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07645547389984131,
"step": 1805,
"valid_targets_mean": 3580.8,
"valid_targets_min": 1354
},
{
"epoch": 5.709779179810726,
"grad_norm": 0.3688483280116813,
"learning_rate": 1.9125429279113173e-05,
"loss": 0.0753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07246281206607819,
"step": 1810,
"valid_targets_mean": 4382.7,
"valid_targets_min": 1097
},
{
"epoch": 5.725552050473186,
"grad_norm": 0.4214260085884563,
"learning_rate": 1.8881171283584752e-05,
"loss": 0.0773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07776229083538055,
"step": 1815,
"valid_targets_mean": 3844.8,
"valid_targets_min": 604
},
{
"epoch": 5.7413249211356465,
"grad_norm": 0.4179569614889491,
"learning_rate": 1.8638119509631853e-05,
"loss": 0.0843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08015948534011841,
"step": 1820,
"valid_targets_mean": 3177.2,
"valid_targets_min": 1444
},
{
"epoch": 5.757097791798107,
"grad_norm": 0.4128154611167564,
"learning_rate": 1.839628337837686e-05,
"loss": 0.0798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0777365192770958,
"step": 1825,
"valid_targets_mean": 3667.2,
"valid_targets_min": 771
},
{
"epoch": 5.7728706624605675,
"grad_norm": 0.40473025860177675,
"learning_rate": 1.8155672263821666e-05,
"loss": 0.0791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08187016099691391,
"step": 1830,
"valid_targets_mean": 3946.0,
"valid_targets_min": 1158
},
{
"epoch": 5.788643533123029,
"grad_norm": 0.4071920066237988,
"learning_rate": 1.7916295492484315e-05,
"loss": 0.0823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08413612842559814,
"step": 1835,
"valid_targets_mean": 3472.1,
"valid_targets_min": 1127
},
{
"epoch": 5.804416403785489,
"grad_norm": 0.445650703253756,
"learning_rate": 1.7678162343037524e-05,
"loss": 0.0889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08886728435754776,
"step": 1840,
"valid_targets_mean": 3285.9,
"valid_targets_min": 828
},
{
"epoch": 5.82018927444795,
"grad_norm": 0.45763369485934957,
"learning_rate": 1.744128204594893e-05,
"loss": 0.0728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08573994040489197,
"step": 1845,
"valid_targets_mean": 3639.5,
"valid_targets_min": 1063
},
{
"epoch": 5.83596214511041,
"grad_norm": 0.40548342584984587,
"learning_rate": 1.7205663783123436e-05,
"loss": 0.083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07565011829137802,
"step": 1850,
"valid_targets_mean": 3692.7,
"valid_targets_min": 1781
},
{
"epoch": 5.851735015772871,
"grad_norm": 0.3967368097642185,
"learning_rate": 1.6971316687547213e-05,
"loss": 0.0759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07565818727016449,
"step": 1855,
"valid_targets_mean": 3699.7,
"valid_targets_min": 782
},
{
"epoch": 5.867507886435331,
"grad_norm": 0.3858704903050818,
"learning_rate": 1.6738249842933697e-05,
"loss": 0.0804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07207715511322021,
"step": 1860,
"valid_targets_mean": 3578.0,
"valid_targets_min": 702
},
{
"epoch": 5.883280757097792,
"grad_norm": 0.4145062078348231,
"learning_rate": 1.6506472283371527e-05,
"loss": 0.0753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0762171596288681,
"step": 1865,
"valid_targets_mean": 3325.8,
"valid_targets_min": 873
},
{
"epoch": 5.899053627760252,
"grad_norm": 0.4057325123132319,
"learning_rate": 1.6275992992974308e-05,
"loss": 0.0734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07129954546689987,
"step": 1870,
"valid_targets_mean": 3912.2,
"valid_targets_min": 1032
},
{
"epoch": 5.914826498422713,
"grad_norm": 0.3837253838222537,
"learning_rate": 1.604682090553243e-05,
"loss": 0.077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06977653503417969,
"step": 1875,
"valid_targets_mean": 3829.0,
"valid_targets_min": 1345
},
{
"epoch": 5.930599369085174,
"grad_norm": 0.3768656129657237,
"learning_rate": 1.5818964904166756e-05,
"loss": 0.0795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08876457065343857,
"step": 1880,
"valid_targets_mean": 4444.9,
"valid_targets_min": 743
},
{
"epoch": 5.946372239747634,
"grad_norm": 0.42683847888241805,
"learning_rate": 1.55924338209843e-05,
"loss": 0.0806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09318177402019501,
"step": 1885,
"valid_targets_mean": 3591.9,
"valid_targets_min": 851
},
{
"epoch": 5.962145110410095,
"grad_norm": 0.4563886592811939,
"learning_rate": 1.536723643673582e-05,
"loss": 0.0822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0869009792804718,
"step": 1890,
"valid_targets_mean": 3317.4,
"valid_targets_min": 897
},
{
"epoch": 5.977917981072555,
"grad_norm": 0.4058601731267914,
"learning_rate": 1.5143381480475583e-05,
"loss": 0.0835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08817443996667862,
"step": 1895,
"valid_targets_mean": 4137.1,
"valid_targets_min": 687
},
{
"epoch": 5.993690851735016,
"grad_norm": 0.42511998845878957,
"learning_rate": 1.49208776292229e-05,
"loss": 0.0805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08329896628856659,
"step": 1900,
"valid_targets_mean": 3452.4,
"valid_targets_min": 619
},
{
"epoch": 6.009463722397476,
"grad_norm": 0.3423195765299723,
"learning_rate": 1.4699733507625862e-05,
"loss": 0.0539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04928043857216835,
"step": 1905,
"valid_targets_mean": 4499.2,
"valid_targets_min": 721
},
{
"epoch": 6.025236593059937,
"grad_norm": 0.42895594904272516,
"learning_rate": 1.4479957687626933e-05,
"loss": 0.0445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04039411246776581,
"step": 1910,
"valid_targets_mean": 3946.0,
"valid_targets_min": 918
},
{
"epoch": 6.041009463722397,
"grad_norm": 0.3345370252031064,
"learning_rate": 1.4261558688130838e-05,
"loss": 0.04,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04135072976350784,
"step": 1915,
"valid_targets_mean": 3727.4,
"valid_targets_min": 944
},
{
"epoch": 6.056782334384858,
"grad_norm": 0.31310879384045104,
"learning_rate": 1.4044544974674246e-05,
"loss": 0.0408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03876585513353348,
"step": 1920,
"valid_targets_mean": 3372.8,
"valid_targets_min": 850
},
{
"epoch": 6.072555205047319,
"grad_norm": 0.3557013457592405,
"learning_rate": 1.3828924959097612e-05,
"loss": 0.0375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04300154745578766,
"step": 1925,
"valid_targets_mean": 4150.1,
"valid_targets_min": 1266
},
{
"epoch": 6.0883280757097795,
"grad_norm": 0.3615210747778512,
"learning_rate": 1.3614706999219213e-05,
"loss": 0.0437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043791744858026505,
"step": 1930,
"valid_targets_mean": 3000.1,
"valid_targets_min": 828
},
{
"epoch": 6.10410094637224,
"grad_norm": 0.33923014031111215,
"learning_rate": 1.340189939851112e-05,
"loss": 0.0382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04425927996635437,
"step": 1935,
"valid_targets_mean": 3822.5,
"valid_targets_min": 883
},
{
"epoch": 6.1198738170347005,
"grad_norm": 0.30112996820412613,
"learning_rate": 1.3190510405777345e-05,
"loss": 0.0403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03676736354827881,
"step": 1940,
"valid_targets_mean": 4339.9,
"valid_targets_min": 335
},
{
"epoch": 6.135646687697161,
"grad_norm": 0.35740080693164195,
"learning_rate": 1.2980548214834142e-05,
"loss": 0.0411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038491666316986084,
"step": 1945,
"valid_targets_mean": 4319.2,
"valid_targets_min": 968
},
{
"epoch": 6.151419558359621,
"grad_norm": 0.28103551068841687,
"learning_rate": 1.2772020964192316e-05,
"loss": 0.0381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.030903656035661697,
"step": 1950,
"valid_targets_mean": 4118.2,
"valid_targets_min": 635
},
{
"epoch": 6.167192429022082,
"grad_norm": 0.37464024197138274,
"learning_rate": 1.2564936736741867e-05,
"loss": 0.0426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048352181911468506,
"step": 1955,
"valid_targets_mean": 3616.3,
"valid_targets_min": 1179
},
{
"epoch": 6.182965299684542,
"grad_norm": 0.29473480639763844,
"learning_rate": 1.23593035594386e-05,
"loss": 0.0375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03645594045519829,
"step": 1960,
"valid_targets_mean": 4119.2,
"valid_targets_min": 1467
},
{
"epoch": 6.198738170347003,
"grad_norm": 0.31569412821264303,
"learning_rate": 1.215512940299305e-05,
"loss": 0.0379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.031205907464027405,
"step": 1965,
"valid_targets_mean": 3533.7,
"valid_targets_min": 883
},
{
"epoch": 6.214511041009464,
"grad_norm": 0.32535633424487764,
"learning_rate": 1.1952422181561424e-05,
"loss": 0.0399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043385475873947144,
"step": 1970,
"valid_targets_mean": 3445.0,
"valid_targets_min": 948
},
{
"epoch": 6.230283911671925,
"grad_norm": 0.3177206593761059,
"learning_rate": 1.1751189752438957e-05,
"loss": 0.0427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03753677383065224,
"step": 1975,
"valid_targets_mean": 4261.9,
"valid_targets_min": 646
},
{
"epoch": 6.246056782334385,
"grad_norm": 0.3280457853812721,
"learning_rate": 1.1551439915755274e-05,
"loss": 0.0389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034581586718559265,
"step": 1980,
"valid_targets_mean": 3294.8,
"valid_targets_min": 519
},
{
"epoch": 6.261829652996846,
"grad_norm": 0.35275018539696723,
"learning_rate": 1.135318041417207e-05,
"loss": 0.0428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04116068780422211,
"step": 1985,
"valid_targets_mean": 3912.3,
"valid_targets_min": 1342
},
{
"epoch": 6.277602523659306,
"grad_norm": 0.31938399505639403,
"learning_rate": 1.1156418932582941e-05,
"loss": 0.0388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03801509737968445,
"step": 1990,
"valid_targets_mean": 4323.4,
"valid_targets_min": 341
},
{
"epoch": 6.2933753943217665,
"grad_norm": 0.33917209363685086,
"learning_rate": 1.096116309781558e-05,
"loss": 0.0391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04274391382932663,
"step": 1995,
"valid_targets_mean": 4026.5,
"valid_targets_min": 1491
},
{
"epoch": 6.309148264984227,
"grad_norm": 0.3325282925211043,
"learning_rate": 1.0767420478336093e-05,
"loss": 0.0414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03704637289047241,
"step": 2000,
"valid_targets_mean": 4074.3,
"valid_targets_min": 1068
},
{
"epoch": 6.3249211356466875,
"grad_norm": 0.37053697656386647,
"learning_rate": 1.0575198583955698e-05,
"loss": 0.042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04724776744842529,
"step": 2005,
"valid_targets_mean": 3510.2,
"valid_targets_min": 356
},
{
"epoch": 6.340694006309148,
"grad_norm": 0.3031965212003397,
"learning_rate": 1.0384504865539497e-05,
"loss": 0.0418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043518148362636566,
"step": 2010,
"valid_targets_mean": 4591.8,
"valid_targets_min": 637
},
{
"epoch": 6.356466876971609,
"grad_norm": 0.3245643524022609,
"learning_rate": 1.0195346714717813e-05,
"loss": 0.0374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03330378234386444,
"step": 2015,
"valid_targets_mean": 3551.2,
"valid_targets_min": 1164
},
{
"epoch": 6.37223974763407,
"grad_norm": 0.35181283985023565,
"learning_rate": 1.0007731463599601e-05,
"loss": 0.0417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04024139419198036,
"step": 2020,
"valid_targets_mean": 3170.5,
"valid_targets_min": 592
},
{
"epoch": 6.38801261829653,
"grad_norm": 0.34299218359203976,
"learning_rate": 9.82166638448827e-06,
"loss": 0.0404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039584726095199585,
"step": 2025,
"valid_targets_mean": 3978.4,
"valid_targets_min": 910
},
{
"epoch": 6.403785488958991,
"grad_norm": 0.33522795043617415,
"learning_rate": 9.637158689599746e-06,
"loss": 0.042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03583469241857529,
"step": 2030,
"valid_targets_mean": 3679.2,
"valid_targets_min": 814
},
{
"epoch": 6.419558359621451,
"grad_norm": 0.32363944460272953,
"learning_rate": 9.454215530782994e-06,
"loss": 0.0422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04818218946456909,
"step": 2035,
"valid_targets_mean": 4480.6,
"valid_targets_min": 1063
},
{
"epoch": 6.435331230283912,
"grad_norm": 0.30372102594833117,
"learning_rate": 9.272843999242736e-06,
"loss": 0.041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03335719555616379,
"step": 2040,
"valid_targets_mean": 3853.0,
"valid_targets_min": 1406
},
{
"epoch": 6.451104100946372,
"grad_norm": 0.3671546063188256,
"learning_rate": 9.093051125264623e-06,
"loss": 0.041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0437227264046669,
"step": 2045,
"valid_targets_mean": 3309.1,
"valid_targets_min": 765
},
{
"epoch": 6.466876971608833,
"grad_norm": 0.3328681104217597,
"learning_rate": 8.91484387794267e-06,
"loss": 0.0395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03580016642808914,
"step": 2050,
"valid_targets_mean": 3748.2,
"valid_targets_min": 570
},
{
"epoch": 6.482649842271293,
"grad_norm": 0.3662060321902368,
"learning_rate": 8.73822916490919e-06,
"loss": 0.0421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055983349680900574,
"step": 2055,
"valid_targets_mean": 3675.6,
"valid_targets_min": 704
},
{
"epoch": 6.498422712933754,
"grad_norm": 0.34580136378911885,
"learning_rate": 8.563213832067014e-06,
"loss": 0.0394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037559874355793,
"step": 2060,
"valid_targets_mean": 3501.8,
"valid_targets_min": 1329
},
{
"epoch": 6.514195583596215,
"grad_norm": 0.345320359793692,
"learning_rate": 8.389804663324142e-06,
"loss": 0.0402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040657106786966324,
"step": 2065,
"valid_targets_mean": 3831.7,
"valid_targets_min": 841
},
{
"epoch": 6.529968454258675,
"grad_norm": 0.3371252768221188,
"learning_rate": 8.218008380330723e-06,
"loss": 0.0421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04118881747126579,
"step": 2070,
"valid_targets_mean": 3966.3,
"valid_targets_min": 961
},
{
"epoch": 6.545741324921136,
"grad_norm": 0.3012902209870019,
"learning_rate": 8.047831642218611e-06,
"loss": 0.0423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03993421420454979,
"step": 2075,
"valid_targets_mean": 4332.0,
"valid_targets_min": 1194
},
{
"epoch": 6.561514195583596,
"grad_norm": 0.2765052846744795,
"learning_rate": 7.879281045343184e-06,
"loss": 0.0398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03392912447452545,
"step": 2080,
"valid_targets_mean": 5162.8,
"valid_targets_min": 868
},
{
"epoch": 6.577287066246057,
"grad_norm": 0.3295787559358221,
"learning_rate": 7.712363123027678e-06,
"loss": 0.0399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03678988665342331,
"step": 2085,
"valid_targets_mean": 3544.0,
"valid_targets_min": 747
},
{
"epoch": 6.593059936908517,
"grad_norm": 0.3372733751760112,
"learning_rate": 7.547084345309924e-06,
"loss": 0.0395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04084780439734459,
"step": 2090,
"valid_targets_mean": 3407.8,
"valid_targets_min": 1283
},
{
"epoch": 6.608832807570978,
"grad_norm": 0.33791441111307363,
"learning_rate": 7.383451118691576e-06,
"loss": 0.0381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.035366613417863846,
"step": 2095,
"valid_targets_mean": 3889.1,
"valid_targets_min": 1538
},
{
"epoch": 6.624605678233438,
"grad_norm": 0.33176711428490663,
"learning_rate": 7.221469785889784e-06,
"loss": 0.0399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041747353971004486,
"step": 2100,
"valid_targets_mean": 3948.8,
"valid_targets_min": 1238
},
{
"epoch": 6.6403785488958995,
"grad_norm": 0.5978543493140935,
"learning_rate": 7.061146625591331e-06,
"loss": 0.0397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.049385398626327515,
"step": 2105,
"valid_targets_mean": 3850.4,
"valid_targets_min": 809
},
{
"epoch": 6.65615141955836,
"grad_norm": 0.3454267755353442,
"learning_rate": 6.902487852209238e-06,
"loss": 0.0372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04414697363972664,
"step": 2110,
"valid_targets_mean": 4047.8,
"valid_targets_min": 750
},
{
"epoch": 6.6719242902208205,
"grad_norm": 0.29185414383492303,
"learning_rate": 6.7454996156419485e-06,
"loss": 0.0364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034449975937604904,
"step": 2115,
"valid_targets_mean": 4683.7,
"valid_targets_min": 1094
},
{
"epoch": 6.687697160883281,
"grad_norm": 0.34219816454313545,
"learning_rate": 6.590188001034864e-06,
"loss": 0.0377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04172135889530182,
"step": 2120,
"valid_targets_mean": 3884.6,
"valid_targets_min": 1086
},
{
"epoch": 6.703470031545741,
"grad_norm": 0.3369809868933638,
"learning_rate": 6.436559028544559e-06,
"loss": 0.0395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03876055032014847,
"step": 2125,
"valid_targets_mean": 3708.0,
"valid_targets_min": 977
},
{
"epoch": 6.719242902208202,
"grad_norm": 0.315311974215639,
"learning_rate": 6.284618653105328e-06,
"loss": 0.0391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03876154497265816,
"step": 2130,
"valid_targets_mean": 3923.0,
"valid_targets_min": 1289
},
{
"epoch": 6.735015772870662,
"grad_norm": 0.3373353918960485,
"learning_rate": 6.134372764198465e-06,
"loss": 0.0394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0393822006881237,
"step": 2135,
"valid_targets_mean": 3684.7,
"valid_targets_min": 925
},
{
"epoch": 6.750788643533123,
"grad_norm": 0.32392467184278273,
"learning_rate": 5.985827185623899e-06,
"loss": 0.0363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03698527812957764,
"step": 2140,
"valid_targets_mean": 3927.2,
"valid_targets_min": 238
},
{
"epoch": 6.766561514195583,
"grad_norm": 0.3443965456972307,
"learning_rate": 5.8389876752745045e-06,
"loss": 0.0402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.038646962493658066,
"step": 2145,
"valid_targets_mean": 3486.0,
"valid_targets_min": 906
},
{
"epoch": 6.782334384858045,
"grad_norm": 0.32713151736206264,
"learning_rate": 5.693859924912892e-06,
"loss": 0.0384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0415056087076664,
"step": 2150,
"valid_targets_mean": 4044.9,
"valid_targets_min": 1097
},
{
"epoch": 6.798107255520505,
"grad_norm": 0.30958861178255653,
"learning_rate": 5.550449559950755e-06,
"loss": 0.0373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03296856954693794,
"step": 2155,
"valid_targets_mean": 3729.6,
"valid_targets_min": 1001
},
{
"epoch": 6.813880126182966,
"grad_norm": 0.29552798234216193,
"learning_rate": 5.408762139230888e-06,
"loss": 0.0389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03640144318342209,
"step": 2160,
"valid_targets_mean": 4315.6,
"valid_targets_min": 693
},
{
"epoch": 6.829652996845426,
"grad_norm": 0.34460179052643625,
"learning_rate": 5.268803154811669e-06,
"loss": 0.0359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03762969374656677,
"step": 2165,
"valid_targets_mean": 3706.4,
"valid_targets_min": 1109
},
{
"epoch": 6.8454258675078865,
"grad_norm": 0.31528346088217085,
"learning_rate": 5.1305780317541855e-06,
"loss": 0.0414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040562450885772705,
"step": 2170,
"valid_targets_mean": 4305.6,
"valid_targets_min": 1330
},
{
"epoch": 6.861198738170347,
"grad_norm": 0.3122264620036574,
"learning_rate": 4.99409212791192e-06,
"loss": 0.0393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040793538093566895,
"step": 2175,
"valid_targets_mean": 4401.1,
"valid_targets_min": 734
},
{
"epoch": 6.8769716088328074,
"grad_norm": 0.31459386735001565,
"learning_rate": 4.8593507337231666e-06,
"loss": 0.0419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0354890376329422,
"step": 2180,
"valid_targets_mean": 3697.2,
"valid_targets_min": 825
},
{
"epoch": 6.892744479495268,
"grad_norm": 0.32466893557156645,
"learning_rate": 4.726359072005859e-06,
"loss": 0.0429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03945270925760269,
"step": 2185,
"valid_targets_mean": 3481.8,
"valid_targets_min": 1082
},
{
"epoch": 6.908517350157728,
"grad_norm": 0.3333960510985479,
"learning_rate": 4.5951222977551444e-06,
"loss": 0.0414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05161520838737488,
"step": 2190,
"valid_targets_mean": 3759.1,
"valid_targets_min": 875
},
{
"epoch": 6.92429022082019,
"grad_norm": 0.2667648088422186,
"learning_rate": 4.465645497943621e-06,
"loss": 0.0359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03310135751962662,
"step": 2195,
"valid_targets_mean": 4283.0,
"valid_targets_min": 1244
},
{
"epoch": 6.94006309148265,
"grad_norm": 0.35169135244926236,
"learning_rate": 4.337933691324109e-06,
"loss": 0.0361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04485854506492615,
"step": 2200,
"valid_targets_mean": 3564.5,
"valid_targets_min": 802
},
{
"epoch": 6.955835962145111,
"grad_norm": 0.3454019187343065,
"learning_rate": 4.21199182823514e-06,
"loss": 0.0359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.039734575897455215,
"step": 2205,
"valid_targets_mean": 4191.7,
"valid_targets_min": 780
},
{
"epoch": 6.971608832807571,
"grad_norm": 0.3400328431593489,
"learning_rate": 4.08782479040905e-06,
"loss": 0.0413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03961391746997833,
"step": 2210,
"valid_targets_mean": 3994.3,
"valid_targets_min": 645
},
{
"epoch": 6.987381703470032,
"grad_norm": 0.3445618162748776,
"learning_rate": 3.9654373907827665e-06,
"loss": 0.0391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04041258245706558,
"step": 2215,
"valid_targets_mean": 3696.0,
"valid_targets_min": 1033
},
{
"epoch": 7.003154574132492,
"grad_norm": 0.24808709523615394,
"learning_rate": 3.844834373311257e-06,
"loss": 0.0368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025598838925361633,
"step": 2220,
"valid_targets_mean": 4450.8,
"valid_targets_min": 691
},
{
"epoch": 7.018927444794953,
"grad_norm": 0.20311641174529407,
"learning_rate": 3.7260204127836316e-06,
"loss": 0.0241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02267434261739254,
"step": 2225,
"valid_targets_mean": 4686.9,
"valid_targets_min": 1093
},
{
"epoch": 7.034700315457413,
"grad_norm": 0.2913507276372168,
"learning_rate": 3.609000114641964e-06,
"loss": 0.0222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023478612303733826,
"step": 2230,
"valid_targets_mean": 4037.2,
"valid_targets_min": 1238
},
{
"epoch": 7.0504731861198735,
"grad_norm": 0.25188372175946383,
"learning_rate": 3.4937780148027344e-06,
"loss": 0.021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020064473152160645,
"step": 2235,
"valid_targets_mean": 3790.7,
"valid_targets_min": 1525
},
{
"epoch": 7.066246056782334,
"grad_norm": 0.2799468731885234,
"learning_rate": 3.3803585794810466e-06,
"loss": 0.0219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021671026945114136,
"step": 2240,
"valid_targets_mean": 3482.3,
"valid_targets_min": 1149
},
{
"epoch": 7.082018927444795,
"grad_norm": 0.22901515937297012,
"learning_rate": 3.2687462050175034e-06,
"loss": 0.0233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022264134138822556,
"step": 2245,
"valid_targets_mean": 4568.3,
"valid_targets_min": 442
},
{
"epoch": 7.097791798107256,
"grad_norm": 0.21965871988446903,
"learning_rate": 3.1589452177077815e-06,
"loss": 0.0239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020710987970232964,
"step": 2250,
"valid_targets_mean": 4003.0,
"valid_targets_min": 619
},
{
"epoch": 7.113564668769716,
"grad_norm": 0.2846193782550197,
"learning_rate": 3.0509598736349343e-06,
"loss": 0.0232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027990806847810745,
"step": 2255,
"valid_targets_mean": 3473.4,
"valid_targets_min": 635
},
{
"epoch": 7.129337539432177,
"grad_norm": 0.25342807787240196,
"learning_rate": 2.9447943585044545e-06,
"loss": 0.0209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01980901136994362,
"step": 2260,
"valid_targets_mean": 3686.9,
"valid_targets_min": 949
},
{
"epoch": 7.145110410094637,
"grad_norm": 0.22599689314876098,
"learning_rate": 2.840452787481979e-06,
"loss": 0.0229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022050093859434128,
"step": 2265,
"valid_targets_mean": 4373.3,
"valid_targets_min": 1060
},
{
"epoch": 7.160883280757098,
"grad_norm": 0.28769966313988754,
"learning_rate": 2.7379392050338236e-06,
"loss": 0.0226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02312508039176464,
"step": 2270,
"valid_targets_mean": 3584.4,
"valid_targets_min": 1148
},
{
"epoch": 7.176656151419558,
"grad_norm": 0.260860431305003,
"learning_rate": 2.63725758477017e-06,
"loss": 0.0226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02554130181670189,
"step": 2275,
"valid_targets_mean": 3841.9,
"valid_targets_min": 666
},
{
"epoch": 7.192429022082019,
"grad_norm": 0.24635859173031086,
"learning_rate": 2.5384118292910818e-06,
"loss": 0.0226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021089503541588783,
"step": 2280,
"valid_targets_mean": 3992.6,
"valid_targets_min": 1190
},
{
"epoch": 7.208201892744479,
"grad_norm": 0.2333594074028827,
"learning_rate": 2.4414057700351934e-06,
"loss": 0.0212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020846040919423103,
"step": 2285,
"valid_targets_mean": 3938.8,
"valid_targets_min": 830
},
{
"epoch": 7.2239747634069404,
"grad_norm": 0.25966767492658177,
"learning_rate": 2.34624316713124e-06,
"loss": 0.0229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020981695502996445,
"step": 2290,
"valid_targets_mean": 3504.3,
"valid_targets_min": 1031
},
{
"epoch": 7.239747634069401,
"grad_norm": 0.22153240765470747,
"learning_rate": 2.2529277092522503e-06,
"loss": 0.0226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020532969385385513,
"step": 2295,
"valid_targets_mean": 4253.0,
"valid_targets_min": 972
},
{
"epoch": 7.255520504731861,
"grad_norm": 0.2559811792469891,
"learning_rate": 2.1614630134726367e-06,
"loss": 0.0197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022255118936300278,
"step": 2300,
"valid_targets_mean": 4342.4,
"valid_targets_min": 978
},
{
"epoch": 7.271293375394322,
"grad_norm": 0.22249476827291575,
"learning_rate": 2.0718526251279346e-06,
"loss": 0.0214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020419348031282425,
"step": 2305,
"valid_targets_mean": 4521.8,
"valid_targets_min": 539
},
{
"epoch": 7.287066246056782,
"grad_norm": 0.22883166477771633,
"learning_rate": 1.9841000176774148e-06,
"loss": 0.0214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02150961011648178,
"step": 2310,
"valid_targets_mean": 4188.1,
"valid_targets_min": 1191
},
{
"epoch": 7.302839116719243,
"grad_norm": 0.26440175569833124,
"learning_rate": 1.898208592569406e-06,
"loss": 0.021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022997155785560608,
"step": 2315,
"valid_targets_mean": 3923.1,
"valid_targets_min": 1363
},
{
"epoch": 7.318611987381703,
"grad_norm": 0.24646636085476814,
"learning_rate": 1.8141816791095e-06,
"loss": 0.0236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02459106408059597,
"step": 2320,
"valid_targets_mean": 4077.3,
"valid_targets_min": 1260
},
{
"epoch": 7.334384858044164,
"grad_norm": 0.2474218671338873,
"learning_rate": 1.7320225343314566e-06,
"loss": 0.0211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01931830868124962,
"step": 2325,
"valid_targets_mean": 3470.6,
"valid_targets_min": 771
},
{
"epoch": 7.350157728706624,
"grad_norm": 0.2615793701812396,
"learning_rate": 1.6517343428709975e-06,
"loss": 0.0238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022896194830536842,
"step": 2330,
"valid_targets_mean": 3343.2,
"valid_targets_min": 1106
},
{
"epoch": 7.365930599369086,
"grad_norm": 0.24866049646271576,
"learning_rate": 1.5733202168423055e-06,
"loss": 0.0218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022526774555444717,
"step": 2335,
"valid_targets_mean": 3570.8,
"valid_targets_min": 1111
},
{
"epoch": 7.381703470031546,
"grad_norm": 0.24398100838951153,
"learning_rate": 1.4967831957174606e-06,
"loss": 0.0215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.019462652504444122,
"step": 2340,
"valid_targets_mean": 4364.1,
"valid_targets_min": 780
},
{
"epoch": 7.3974763406940065,
"grad_norm": 0.27051410831935213,
"learning_rate": 1.4221262462085715e-06,
"loss": 0.0251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025676360353827477,
"step": 2345,
"valid_targets_mean": 3603.3,
"valid_targets_min": 604
},
{
"epoch": 7.413249211356467,
"grad_norm": 0.3096679579306045,
"learning_rate": 1.3493522621528088e-06,
"loss": 0.0244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024824511259794235,
"step": 2350,
"valid_targets_mean": 3219.4,
"valid_targets_min": 736
},
{
"epoch": 7.429022082018927,
"grad_norm": 0.252879366286297,
"learning_rate": 1.2784640644002366e-06,
"loss": 0.0214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022230399772524834,
"step": 2355,
"valid_targets_mean": 3287.1,
"valid_targets_min": 742
},
{
"epoch": 7.444794952681388,
"grad_norm": 0.20998147562039438,
"learning_rate": 1.209464400704452e-06,
"loss": 0.0206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01767810247838497,
"step": 2360,
"valid_targets_mean": 4389.2,
"valid_targets_min": 927
},
{
"epoch": 7.460567823343848,
"grad_norm": 0.27043175393365976,
"learning_rate": 1.1423559456160803e-06,
"loss": 0.0223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02215229906141758,
"step": 2365,
"valid_targets_mean": 3194.0,
"valid_targets_min": 925
},
{
"epoch": 7.476340694006309,
"grad_norm": 0.2564017112706904,
"learning_rate": 1.0771413003791253e-06,
"loss": 0.0202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020249977707862854,
"step": 2370,
"valid_targets_mean": 3954.9,
"valid_targets_min": 937
},
{
"epoch": 7.492113564668769,
"grad_norm": 0.22802210655502397,
"learning_rate": 1.0138229928301212e-06,
"loss": 0.0212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018750024959445,
"step": 2375,
"valid_targets_mean": 3741.9,
"valid_targets_min": 821
},
{
"epoch": 7.50788643533123,
"grad_norm": 0.22394765960486246,
"learning_rate": 9.524034773001511e-07,
"loss": 0.0193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016100244596600533,
"step": 2380,
"valid_targets_mean": 3365.4,
"valid_targets_min": 948
},
{
"epoch": 7.523659305993691,
"grad_norm": 0.23405243563989528,
"learning_rate": 8.928851345197165e-07,
"loss": 0.0229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02146870270371437,
"step": 2385,
"valid_targets_mean": 3963.8,
"valid_targets_min": 702
},
{
"epoch": 7.539432176656152,
"grad_norm": 0.22220117881236737,
"learning_rate": 8.352702715264726e-07,
"loss": 0.022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018834460526704788,
"step": 2390,
"valid_targets_mean": 4035.9,
"valid_targets_min": 1400
},
{
"epoch": 7.555205047318612,
"grad_norm": 0.2824422608959941,
"learning_rate": 7.795611215757615e-07,
"loss": 0.0229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02203229069709778,
"step": 2395,
"valid_targets_mean": 3184.9,
"valid_targets_min": 582
},
{
"epoch": 7.570977917981073,
"grad_norm": 0.24152675863727685,
"learning_rate": 7.257598440540802e-07,
"loss": 0.025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020647384226322174,
"step": 2400,
"valid_targets_mean": 3745.3,
"valid_targets_min": 1344
},
{
"epoch": 7.586750788643533,
"grad_norm": 0.25427069001772656,
"learning_rate": 6.738685243953769e-07,
"loss": 0.0245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022360961884260178,
"step": 2405,
"valid_targets_mean": 4033.4,
"valid_targets_min": 1509
},
{
"epoch": 7.6025236593059935,
"grad_norm": 0.2447796849963383,
"learning_rate": 6.238891740002195e-07,
"loss": 0.0213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02267741598188877,
"step": 2410,
"valid_targets_mean": 4396.5,
"valid_targets_min": 704
},
{
"epoch": 7.618296529968454,
"grad_norm": 0.1947016798039757,
"learning_rate": 5.758237301577874e-07,
"loss": 0.0218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017979349941015244,
"step": 2415,
"valid_targets_mean": 4253.2,
"valid_targets_min": 961
},
{
"epoch": 7.634069400630915,
"grad_norm": 0.26242474747372385,
"learning_rate": 5.296740559708413e-07,
"loss": 0.0224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.025327244773507118,
"step": 2420,
"valid_targets_mean": 4355.0,
"valid_targets_min": 1385
},
{
"epoch": 7.649842271293375,
"grad_norm": 0.2873187770068635,
"learning_rate": 4.854419402834709e-07,
"loss": 0.0231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.029193349182605743,
"step": 2425,
"valid_targets_mean": 3987.2,
"valid_targets_min": 1301
},
{
"epoch": 7.665615141955836,
"grad_norm": 0.25080676062406615,
"learning_rate": 4.431290976117497e-07,
"loss": 0.0224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02236909046769142,
"step": 2430,
"valid_targets_mean": 3526.8,
"valid_targets_min": 825
},
{
"epoch": 7.681388012618297,
"grad_norm": 0.2679068276217551,
"learning_rate": 4.0273716807731067e-07,
"loss": 0.0223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02555161528289318,
"step": 2435,
"valid_targets_mean": 3574.3,
"valid_targets_min": 1514
},
{
"epoch": 7.697160883280757,
"grad_norm": 0.2527799820599618,
"learning_rate": 3.642677173437137e-07,
"loss": 0.023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022830359637737274,
"step": 2440,
"valid_targets_mean": 3984.7,
"valid_targets_min": 1429
},
{
"epoch": 7.712933753943218,
"grad_norm": 0.24723303602718177,
"learning_rate": 3.2772223655583857e-07,
"loss": 0.0221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022257965058088303,
"step": 2445,
"valid_targets_mean": 4166.3,
"valid_targets_min": 1078
},
{
"epoch": 7.728706624605678,
"grad_norm": 0.24609326590877015,
"learning_rate": 2.9310214228202013e-07,
"loss": 0.0235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01870781183242798,
"step": 2450,
"valid_targets_mean": 3395.5,
"valid_targets_min": 1175
},
{
"epoch": 7.744479495268139,
"grad_norm": 0.2455031161070336,
"learning_rate": 2.604087764591534e-07,
"loss": 0.0219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021903114393353462,
"step": 2455,
"valid_targets_mean": 4218.6,
"valid_targets_min": 867
},
{
"epoch": 7.760252365930599,
"grad_norm": 0.2800194629999433,
"learning_rate": 2.2964340634069603e-07,
"loss": 0.0232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022704198956489563,
"step": 2460,
"valid_targets_mean": 3092.3,
"valid_targets_min": 765
},
{
"epoch": 7.7760252365930596,
"grad_norm": 0.2584271088036407,
"learning_rate": 2.0080722444754118e-07,
"loss": 0.0234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.021550491452217102,
"step": 2465,
"valid_targets_mean": 3626.9,
"valid_targets_min": 380
},
{
"epoch": 7.79179810725552,
"grad_norm": 0.22787140593944627,
"learning_rate": 1.7390134852177664e-07,
"loss": 0.0258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.01774200238287449,
"step": 2470,
"valid_targets_mean": 3878.1,
"valid_targets_min": 964
},
{
"epoch": 7.807570977917981,
"grad_norm": 0.30621669971194165,
"learning_rate": 1.48926821483375e-07,
"loss": 0.0249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0292455293238163,
"step": 2475,
"valid_targets_mean": 3496.4,
"valid_targets_min": 700
},
{
"epoch": 7.823343848580442,
"grad_norm": 0.22754985262911764,
"learning_rate": 1.2588461138977604e-07,
"loss": 0.0205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.020763764157891273,
"step": 2480,
"valid_targets_mean": 4017.9,
"valid_targets_min": 1265
},
{
"epoch": 7.839116719242902,
"grad_norm": 0.24205972437180406,
"learning_rate": 1.0477561139832781e-07,
"loss": 0.024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02504826709628105,
"step": 2485,
"valid_targets_mean": 4303.2,
"valid_targets_min": 882
},
{
"epoch": 7.854889589905363,
"grad_norm": 0.2525430850860654,
"learning_rate": 8.560063973171439e-08,
"loss": 0.0246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.027818750590085983,
"step": 2490,
"valid_targets_mean": 3742.2,
"valid_targets_min": 763
},
{
"epoch": 7.870662460567823,
"grad_norm": 0.21015295804895337,
"learning_rate": 6.836043964620342e-08,
"loss": 0.0213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017499791458249092,
"step": 2495,
"valid_targets_mean": 4126.9,
"valid_targets_min": 1097
},
{
"epoch": 7.886435331230284,
"grad_norm": 0.23969974208310643,
"learning_rate": 5.3055679402846946e-08,
"loss": 0.0222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022856732830405235,
"step": 2500,
"valid_targets_mean": 4013.2,
"valid_targets_min": 1041
},
{
"epoch": 7.902208201892744,
"grad_norm": 0.26209668108487033,
"learning_rate": 3.968695224158547e-08,
"loss": 0.0221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.024923603981733322,
"step": 2505,
"valid_targets_mean": 3558.2,
"valid_targets_min": 1009
},
{
"epoch": 7.917981072555205,
"grad_norm": 0.258239974989192,
"learning_rate": 2.8254776358238588e-08,
"loss": 0.0232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.022169824689626694,
"step": 2510,
"valid_targets_mean": 4173.0,
"valid_targets_min": 1379
},
{
"epoch": 7.933753943217665,
"grad_norm": 0.2103350701053391,
"learning_rate": 1.8759594884443233e-08,
"loss": 0.0214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.017467107623815536,
"step": 2515,
"valid_targets_mean": 4391.8,
"valid_targets_min": 1271
},
{
"epoch": 7.9495268138801265,
"grad_norm": 0.25141140585193267,
"learning_rate": 1.1201775870445242e-08,
"loss": 0.0208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02066458761692047,
"step": 2520,
"valid_targets_mean": 4108.5,
"valid_targets_min": 1098
},
{
"epoch": 7.965299684542587,
"grad_norm": 0.2245523196062546,
"learning_rate": 5.581612270855186e-09,
"loss": 0.0223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.018932700157165527,
"step": 2525,
"valid_targets_mean": 4325.3,
"valid_targets_min": 1171
},
{
"epoch": 7.981072555205047,
"grad_norm": 0.271744707250328,
"learning_rate": 1.8993219332907877e-09,
"loss": 0.0214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.023682236671447754,
"step": 2530,
"valid_targets_mean": 3315.0,
"valid_targets_min": 757
},
{
"epoch": 7.996845425867508,
"grad_norm": 0.26771159667476085,
"learning_rate": 1.5504758992257451e-10,
"loss": 0.0225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.02129640057682991,
"step": 2535,
"valid_targets_mean": 3254.4,
"valid_targets_min": 993
},
{
"epoch": 8.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.016571061685681343,
"step": 2536,
"total_flos": 1378268975529984.0,
"train_loss": 0.16813087239582386,
"train_runtime": 37774.5792,
"train_samples_per_second": 2.146,
"train_steps_per_second": 0.067,
"valid_targets_mean": 4493.3,
"valid_targets_min": 905
}
],
"logging_steps": 5,
"max_steps": 2536,
"num_input_tokens_seen": 0,
"num_train_epochs": 8,
"save_steps": 100,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1378268975529984.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}