Files
a1-wizardlm_orca/trainer_state.json
ModelHub XC 500ddb353f 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/a1-wizardlm_orca
Source: Original Platform
2026-05-02 03:34:10 +08:00

8980 lines
248 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4060,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008620689655172414,
"grad_norm": 13.232932097220655,
"learning_rate": 3.9408866995073894e-07,
"loss": 0.8415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8860415816307068,
"step": 5,
"valid_targets_mean": 2136.3,
"valid_targets_min": 481
},
{
"epoch": 0.017241379310344827,
"grad_norm": 7.697570930444164,
"learning_rate": 8.866995073891626e-07,
"loss": 0.8298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8184617757797241,
"step": 10,
"valid_targets_mean": 5075.8,
"valid_targets_min": 1010
},
{
"epoch": 0.02586206896551724,
"grad_norm": 11.504287176795119,
"learning_rate": 1.3793103448275862e-06,
"loss": 0.8474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8526071310043335,
"step": 15,
"valid_targets_mean": 2459.5,
"valid_targets_min": 519
},
{
"epoch": 0.034482758620689655,
"grad_norm": 11.157594988010677,
"learning_rate": 1.8719211822660098e-06,
"loss": 0.8062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8563398718833923,
"step": 20,
"valid_targets_mean": 2083.9,
"valid_targets_min": 475
},
{
"epoch": 0.04310344827586207,
"grad_norm": 7.454562769727624,
"learning_rate": 2.3645320197044334e-06,
"loss": 0.7396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6408491134643555,
"step": 25,
"valid_targets_mean": 2346.5,
"valid_targets_min": 565
},
{
"epoch": 0.05172413793103448,
"grad_norm": 4.462332245510196,
"learning_rate": 2.8571428571428573e-06,
"loss": 0.7238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5656313896179199,
"step": 30,
"valid_targets_mean": 2104.9,
"valid_targets_min": 510
},
{
"epoch": 0.0603448275862069,
"grad_norm": 3.8825932284325297,
"learning_rate": 3.349753694581281e-06,
"loss": 0.7084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7533521056175232,
"step": 35,
"valid_targets_mean": 1671.2,
"valid_targets_min": 693
},
{
"epoch": 0.06896551724137931,
"grad_norm": 1.722144166921226,
"learning_rate": 3.842364532019705e-06,
"loss": 0.6874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6071873903274536,
"step": 40,
"valid_targets_mean": 3528.5,
"valid_targets_min": 560
},
{
"epoch": 0.07758620689655173,
"grad_norm": 2.321454376114494,
"learning_rate": 4.334975369458129e-06,
"loss": 0.6636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6896767616271973,
"step": 45,
"valid_targets_mean": 1569.0,
"valid_targets_min": 555
},
{
"epoch": 0.08620689655172414,
"grad_norm": 1.2086382136138112,
"learning_rate": 4.8275862068965525e-06,
"loss": 0.6038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5344650745391846,
"step": 50,
"valid_targets_mean": 2312.8,
"valid_targets_min": 599
},
{
"epoch": 0.09482758620689655,
"grad_norm": 0.9529660756316026,
"learning_rate": 5.320197044334976e-06,
"loss": 0.6209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4809268116950989,
"step": 55,
"valid_targets_mean": 2783.3,
"valid_targets_min": 508
},
{
"epoch": 0.10344827586206896,
"grad_norm": 0.780182127462651,
"learning_rate": 5.812807881773399e-06,
"loss": 0.5396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4358481764793396,
"step": 60,
"valid_targets_mean": 3265.1,
"valid_targets_min": 633
},
{
"epoch": 0.11206896551724138,
"grad_norm": 0.9472444738751354,
"learning_rate": 6.305418719211823e-06,
"loss": 0.5647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6075949668884277,
"step": 65,
"valid_targets_mean": 2665.1,
"valid_targets_min": 431
},
{
"epoch": 0.1206896551724138,
"grad_norm": 0.830653122252629,
"learning_rate": 6.798029556650246e-06,
"loss": 0.5177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5087354779243469,
"step": 70,
"valid_targets_mean": 2723.9,
"valid_targets_min": 669
},
{
"epoch": 0.12931034482758622,
"grad_norm": 1.0815877554445863,
"learning_rate": 7.290640394088671e-06,
"loss": 0.5517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.686690092086792,
"step": 75,
"valid_targets_mean": 1865.0,
"valid_targets_min": 644
},
{
"epoch": 0.13793103448275862,
"grad_norm": 1.132738933241941,
"learning_rate": 7.783251231527095e-06,
"loss": 0.6183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5349428653717041,
"step": 80,
"valid_targets_mean": 2359.5,
"valid_targets_min": 887
},
{
"epoch": 0.14655172413793102,
"grad_norm": 0.6591541818226556,
"learning_rate": 8.275862068965518e-06,
"loss": 0.4737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.382580041885376,
"step": 85,
"valid_targets_mean": 3268.1,
"valid_targets_min": 758
},
{
"epoch": 0.15517241379310345,
"grad_norm": 0.9248007332339961,
"learning_rate": 8.768472906403942e-06,
"loss": 0.5053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.527409553527832,
"step": 90,
"valid_targets_mean": 2054.4,
"valid_targets_min": 730
},
{
"epoch": 0.16379310344827586,
"grad_norm": 0.9086933978595335,
"learning_rate": 9.261083743842364e-06,
"loss": 0.5679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6158876419067383,
"step": 95,
"valid_targets_mean": 2684.1,
"valid_targets_min": 427
},
{
"epoch": 0.1724137931034483,
"grad_norm": 0.8976459156554277,
"learning_rate": 9.75369458128079e-06,
"loss": 0.5457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6348117589950562,
"step": 100,
"valid_targets_mean": 2928.3,
"valid_targets_min": 675
},
{
"epoch": 0.1810344827586207,
"grad_norm": 0.902855097961049,
"learning_rate": 1.0246305418719214e-05,
"loss": 0.5007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5758171677589417,
"step": 105,
"valid_targets_mean": 2074.6,
"valid_targets_min": 481
},
{
"epoch": 0.1896551724137931,
"grad_norm": 0.5842031863511825,
"learning_rate": 1.0738916256157637e-05,
"loss": 0.4347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38487473130226135,
"step": 110,
"valid_targets_mean": 3755.7,
"valid_targets_min": 586
},
{
"epoch": 0.19827586206896552,
"grad_norm": 0.7740217123427929,
"learning_rate": 1.123152709359606e-05,
"loss": 0.502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43103402853012085,
"step": 115,
"valid_targets_mean": 2872.9,
"valid_targets_min": 647
},
{
"epoch": 0.20689655172413793,
"grad_norm": 0.8902368577963162,
"learning_rate": 1.1724137931034483e-05,
"loss": 0.552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.548175573348999,
"step": 120,
"valid_targets_mean": 2121.9,
"valid_targets_min": 875
},
{
"epoch": 0.21551724137931033,
"grad_norm": 0.8264039936367132,
"learning_rate": 1.2216748768472909e-05,
"loss": 0.4823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4839908480644226,
"step": 125,
"valid_targets_mean": 2181.6,
"valid_targets_min": 603
},
{
"epoch": 0.22413793103448276,
"grad_norm": 0.8450133097474695,
"learning_rate": 1.2709359605911331e-05,
"loss": 0.443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45593246817588806,
"step": 130,
"valid_targets_mean": 2023.6,
"valid_targets_min": 576
},
{
"epoch": 0.23275862068965517,
"grad_norm": 0.5788964343898347,
"learning_rate": 1.3201970443349755e-05,
"loss": 0.5249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3811132609844208,
"step": 135,
"valid_targets_mean": 3966.9,
"valid_targets_min": 1118
},
{
"epoch": 0.2413793103448276,
"grad_norm": 0.7632885346479155,
"learning_rate": 1.369458128078818e-05,
"loss": 0.5116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.56120765209198,
"step": 140,
"valid_targets_mean": 3156.3,
"valid_targets_min": 481
},
{
"epoch": 0.25,
"grad_norm": 0.8620275887963595,
"learning_rate": 1.4187192118226602e-05,
"loss": 0.5083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.53715980052948,
"step": 145,
"valid_targets_mean": 2210.4,
"valid_targets_min": 684
},
{
"epoch": 0.25862068965517243,
"grad_norm": 0.8511906311114458,
"learning_rate": 1.4679802955665026e-05,
"loss": 0.4255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4668218493461609,
"step": 150,
"valid_targets_mean": 2173.1,
"valid_targets_min": 870
},
{
"epoch": 0.2672413793103448,
"grad_norm": 0.7555714152272107,
"learning_rate": 1.5172413793103448e-05,
"loss": 0.4816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37490010261535645,
"step": 155,
"valid_targets_mean": 2356.9,
"valid_targets_min": 538
},
{
"epoch": 0.27586206896551724,
"grad_norm": 0.8402578283696395,
"learning_rate": 1.5665024630541875e-05,
"loss": 0.5105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5459040403366089,
"step": 160,
"valid_targets_mean": 2340.6,
"valid_targets_min": 429
},
{
"epoch": 0.28448275862068967,
"grad_norm": 0.6775840481703621,
"learning_rate": 1.6157635467980298e-05,
"loss": 0.4612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36925819516181946,
"step": 165,
"valid_targets_mean": 2578.4,
"valid_targets_min": 485
},
{
"epoch": 0.29310344827586204,
"grad_norm": 0.780109213871394,
"learning_rate": 1.665024630541872e-05,
"loss": 0.475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5196021795272827,
"step": 170,
"valid_targets_mean": 2996.8,
"valid_targets_min": 1004
},
{
"epoch": 0.3017241379310345,
"grad_norm": 0.8548697531410809,
"learning_rate": 1.7142857142857142e-05,
"loss": 0.4598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4733397662639618,
"step": 175,
"valid_targets_mean": 2293.2,
"valid_targets_min": 569
},
{
"epoch": 0.3103448275862069,
"grad_norm": 0.8546736192908461,
"learning_rate": 1.7635467980295567e-05,
"loss": 0.4672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43413564562797546,
"step": 180,
"valid_targets_mean": 1991.5,
"valid_targets_min": 864
},
{
"epoch": 0.31896551724137934,
"grad_norm": 0.7252441236863357,
"learning_rate": 1.8128078817733993e-05,
"loss": 0.4961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5404946208000183,
"step": 185,
"valid_targets_mean": 3216.4,
"valid_targets_min": 1294
},
{
"epoch": 0.3275862068965517,
"grad_norm": 0.7989378071687083,
"learning_rate": 1.8620689655172415e-05,
"loss": 0.4817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5027145743370056,
"step": 190,
"valid_targets_mean": 2232.9,
"valid_targets_min": 395
},
{
"epoch": 0.33620689655172414,
"grad_norm": 0.7178395258693016,
"learning_rate": 1.911330049261084e-05,
"loss": 0.468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5232639312744141,
"step": 195,
"valid_targets_mean": 3374.6,
"valid_targets_min": 611
},
{
"epoch": 0.3448275862068966,
"grad_norm": 0.6329553171336134,
"learning_rate": 1.9605911330049263e-05,
"loss": 0.4526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4167773425579071,
"step": 200,
"valid_targets_mean": 3209.2,
"valid_targets_min": 485
},
{
"epoch": 0.35344827586206895,
"grad_norm": 0.6728546038871683,
"learning_rate": 2.0098522167487688e-05,
"loss": 0.4307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3922424018383026,
"step": 205,
"valid_targets_mean": 2740.6,
"valid_targets_min": 969
},
{
"epoch": 0.3620689655172414,
"grad_norm": 1.04961738262584,
"learning_rate": 2.059113300492611e-05,
"loss": 0.5102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4533177614212036,
"step": 210,
"valid_targets_mean": 2375.1,
"valid_targets_min": 536
},
{
"epoch": 0.3706896551724138,
"grad_norm": 0.7434878133431768,
"learning_rate": 2.1083743842364536e-05,
"loss": 0.4855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5148615837097168,
"step": 215,
"valid_targets_mean": 3240.9,
"valid_targets_min": 460
},
{
"epoch": 0.3793103448275862,
"grad_norm": 0.7872528477220174,
"learning_rate": 2.1576354679802954e-05,
"loss": 0.4621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4126091003417969,
"step": 220,
"valid_targets_mean": 2226.2,
"valid_targets_min": 825
},
{
"epoch": 0.3879310344827586,
"grad_norm": 0.7540671720188216,
"learning_rate": 2.206896551724138e-05,
"loss": 0.4648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4633001387119293,
"step": 225,
"valid_targets_mean": 2634.1,
"valid_targets_min": 660
},
{
"epoch": 0.39655172413793105,
"grad_norm": 0.7420533564001498,
"learning_rate": 2.2561576354679805e-05,
"loss": 0.4487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4774375259876251,
"step": 230,
"valid_targets_mean": 2631.4,
"valid_targets_min": 282
},
{
"epoch": 0.4051724137931034,
"grad_norm": 0.6157590867590423,
"learning_rate": 2.3054187192118228e-05,
"loss": 0.4621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43844375014305115,
"step": 235,
"valid_targets_mean": 4082.3,
"valid_targets_min": 573
},
{
"epoch": 0.41379310344827586,
"grad_norm": 0.8565991200200499,
"learning_rate": 2.3546798029556653e-05,
"loss": 0.5309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6025887727737427,
"step": 240,
"valid_targets_mean": 2522.6,
"valid_targets_min": 586
},
{
"epoch": 0.4224137931034483,
"grad_norm": 1.2583799529045883,
"learning_rate": 2.403940886699508e-05,
"loss": 0.4855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5208061933517456,
"step": 245,
"valid_targets_mean": 2395.9,
"valid_targets_min": 437
},
{
"epoch": 0.43103448275862066,
"grad_norm": 0.8146647432675135,
"learning_rate": 2.4532019704433497e-05,
"loss": 0.4903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45655834674835205,
"step": 250,
"valid_targets_mean": 2176.9,
"valid_targets_min": 1070
},
{
"epoch": 0.4396551724137931,
"grad_norm": 0.8072309949308645,
"learning_rate": 2.5024630541871923e-05,
"loss": 0.4304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47415584325790405,
"step": 255,
"valid_targets_mean": 2326.9,
"valid_targets_min": 638
},
{
"epoch": 0.4482758620689655,
"grad_norm": 0.8227419849582898,
"learning_rate": 2.551724137931035e-05,
"loss": 0.4459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39482447504997253,
"step": 260,
"valid_targets_mean": 1956.3,
"valid_targets_min": 528
},
{
"epoch": 0.45689655172413796,
"grad_norm": 0.930242183186987,
"learning_rate": 2.600985221674877e-05,
"loss": 0.4728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44298598170280457,
"step": 265,
"valid_targets_mean": 1632.1,
"valid_targets_min": 549
},
{
"epoch": 0.46551724137931033,
"grad_norm": 0.6101603625456252,
"learning_rate": 2.6502463054187196e-05,
"loss": 0.4629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47349387407302856,
"step": 270,
"valid_targets_mean": 4623.9,
"valid_targets_min": 982
},
{
"epoch": 0.47413793103448276,
"grad_norm": 0.9537571622572907,
"learning_rate": 2.6995073891625615e-05,
"loss": 0.5005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47361212968826294,
"step": 275,
"valid_targets_mean": 2541.9,
"valid_targets_min": 723
},
{
"epoch": 0.4827586206896552,
"grad_norm": 0.7408116261053846,
"learning_rate": 2.748768472906404e-05,
"loss": 0.4559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5130395889282227,
"step": 280,
"valid_targets_mean": 2848.1,
"valid_targets_min": 933
},
{
"epoch": 0.49137931034482757,
"grad_norm": 0.6817201938253903,
"learning_rate": 2.7980295566502466e-05,
"loss": 0.494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45302706956863403,
"step": 285,
"valid_targets_mean": 3216.0,
"valid_targets_min": 909
},
{
"epoch": 0.5,
"grad_norm": 0.8714105802109559,
"learning_rate": 2.8472906403940888e-05,
"loss": 0.4814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5157756805419922,
"step": 290,
"valid_targets_mean": 2243.6,
"valid_targets_min": 561
},
{
"epoch": 0.5086206896551724,
"grad_norm": 0.7282708487682565,
"learning_rate": 2.8965517241379313e-05,
"loss": 0.4614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39844846725463867,
"step": 295,
"valid_targets_mean": 3180.0,
"valid_targets_min": 644
},
{
"epoch": 0.5172413793103449,
"grad_norm": 0.8975983503967481,
"learning_rate": 2.945812807881774e-05,
"loss": 0.4388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.531843900680542,
"step": 300,
"valid_targets_mean": 1914.1,
"valid_targets_min": 546
},
{
"epoch": 0.5258620689655172,
"grad_norm": 0.8163712348212677,
"learning_rate": 2.9950738916256158e-05,
"loss": 0.5058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5456841588020325,
"step": 305,
"valid_targets_mean": 2314.6,
"valid_targets_min": 756
},
{
"epoch": 0.5344827586206896,
"grad_norm": 0.7895716575686172,
"learning_rate": 3.0443349753694583e-05,
"loss": 0.4494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4308232069015503,
"step": 310,
"valid_targets_mean": 2846.6,
"valid_targets_min": 299
},
{
"epoch": 0.5431034482758621,
"grad_norm": 0.6475104958991397,
"learning_rate": 3.093596059113301e-05,
"loss": 0.4426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39463210105895996,
"step": 315,
"valid_targets_mean": 3386.5,
"valid_targets_min": 646
},
{
"epoch": 0.5517241379310345,
"grad_norm": 0.9928118152840254,
"learning_rate": 3.142857142857143e-05,
"loss": 0.478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4573419690132141,
"step": 320,
"valid_targets_mean": 1744.3,
"valid_targets_min": 375
},
{
"epoch": 0.5603448275862069,
"grad_norm": 0.8950697219459826,
"learning_rate": 3.1921182266009856e-05,
"loss": 0.4686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41824567317962646,
"step": 325,
"valid_targets_mean": 1810.9,
"valid_targets_min": 873
},
{
"epoch": 0.5689655172413793,
"grad_norm": 0.8043290863445247,
"learning_rate": 3.2413793103448275e-05,
"loss": 0.4703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5139874815940857,
"step": 330,
"valid_targets_mean": 2277.0,
"valid_targets_min": 773
},
{
"epoch": 0.5775862068965517,
"grad_norm": 0.9413544056683327,
"learning_rate": 3.29064039408867e-05,
"loss": 0.4245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40947747230529785,
"step": 335,
"valid_targets_mean": 1762.7,
"valid_targets_min": 571
},
{
"epoch": 0.5862068965517241,
"grad_norm": 0.6861532735672352,
"learning_rate": 3.3399014778325126e-05,
"loss": 0.463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39968305826187134,
"step": 340,
"valid_targets_mean": 3021.8,
"valid_targets_min": 863
},
{
"epoch": 0.5948275862068966,
"grad_norm": 0.8640437276593032,
"learning_rate": 3.389162561576355e-05,
"loss": 0.4665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43528294563293457,
"step": 345,
"valid_targets_mean": 2015.9,
"valid_targets_min": 626
},
{
"epoch": 0.603448275862069,
"grad_norm": 0.732764848171335,
"learning_rate": 3.438423645320197e-05,
"loss": 0.4797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5329480171203613,
"step": 350,
"valid_targets_mean": 2950.9,
"valid_targets_min": 785
},
{
"epoch": 0.6120689655172413,
"grad_norm": 0.8024994379243645,
"learning_rate": 3.4876847290640396e-05,
"loss": 0.4418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4507256746292114,
"step": 355,
"valid_targets_mean": 2193.6,
"valid_targets_min": 442
},
{
"epoch": 0.6206896551724138,
"grad_norm": 0.8262666854372246,
"learning_rate": 3.536945812807882e-05,
"loss": 0.4798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48532766103744507,
"step": 360,
"valid_targets_mean": 2739.9,
"valid_targets_min": 642
},
{
"epoch": 0.6293103448275862,
"grad_norm": 0.6332844053249423,
"learning_rate": 3.586206896551725e-05,
"loss": 0.4045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3117547035217285,
"step": 365,
"valid_targets_mean": 2887.0,
"valid_targets_min": 617
},
{
"epoch": 0.6379310344827587,
"grad_norm": 0.7460508213663771,
"learning_rate": 3.6354679802955665e-05,
"loss": 0.4704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5197142958641052,
"step": 370,
"valid_targets_mean": 2832.7,
"valid_targets_min": 492
},
{
"epoch": 0.646551724137931,
"grad_norm": 0.5464572201060651,
"learning_rate": 3.684729064039409e-05,
"loss": 0.43,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35164475440979004,
"step": 375,
"valid_targets_mean": 4484.4,
"valid_targets_min": 758
},
{
"epoch": 0.6551724137931034,
"grad_norm": 0.8991528330150939,
"learning_rate": 3.7339901477832516e-05,
"loss": 0.4636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3793317675590515,
"step": 380,
"valid_targets_mean": 1875.5,
"valid_targets_min": 787
},
{
"epoch": 0.6637931034482759,
"grad_norm": 0.6949477428765862,
"learning_rate": 3.7832512315270935e-05,
"loss": 0.4305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4816117286682129,
"step": 385,
"valid_targets_mean": 4579.9,
"valid_targets_min": 611
},
{
"epoch": 0.6724137931034483,
"grad_norm": 0.6593748377546642,
"learning_rate": 3.832512315270936e-05,
"loss": 0.4543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4020620584487915,
"step": 390,
"valid_targets_mean": 2879.8,
"valid_targets_min": 999
},
{
"epoch": 0.6810344827586207,
"grad_norm": 1.0434173212328082,
"learning_rate": 3.8817733990147786e-05,
"loss": 0.4919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5102270245552063,
"step": 395,
"valid_targets_mean": 1963.6,
"valid_targets_min": 531
},
{
"epoch": 0.6896551724137931,
"grad_norm": 0.891541913502292,
"learning_rate": 3.931034482758621e-05,
"loss": 0.4897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5392195582389832,
"step": 400,
"valid_targets_mean": 2574.2,
"valid_targets_min": 757
},
{
"epoch": 0.6982758620689655,
"grad_norm": 1.1541729925888546,
"learning_rate": 3.980295566502464e-05,
"loss": 0.4299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42217105627059937,
"step": 405,
"valid_targets_mean": 2676.6,
"valid_targets_min": 479
},
{
"epoch": 0.7068965517241379,
"grad_norm": 0.7698263830350504,
"learning_rate": 3.999993347192948e-05,
"loss": 0.4158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4036504328250885,
"step": 410,
"valid_targets_mean": 2536.8,
"valid_targets_min": 566
},
{
"epoch": 0.7155172413793104,
"grad_norm": 0.7305436039635469,
"learning_rate": 3.9999526913101334e-05,
"loss": 0.4429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45616382360458374,
"step": 415,
"valid_targets_mean": 2623.6,
"valid_targets_min": 740
},
{
"epoch": 0.7241379310344828,
"grad_norm": 0.5924152937193563,
"learning_rate": 3.999875076298832e-05,
"loss": 0.4298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3307499587535858,
"step": 420,
"valid_targets_mean": 3216.8,
"valid_targets_min": 794
},
{
"epoch": 0.7327586206896551,
"grad_norm": 0.7974007037020275,
"learning_rate": 3.9997605035933704e-05,
"loss": 0.4076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3921046555042267,
"step": 425,
"valid_targets_mean": 2243.4,
"valid_targets_min": 584
},
{
"epoch": 0.7413793103448276,
"grad_norm": 0.7809983920045804,
"learning_rate": 3.99960897531105e-05,
"loss": 0.4023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4133235216140747,
"step": 430,
"valid_targets_mean": 2451.4,
"valid_targets_min": 683
},
{
"epoch": 0.75,
"grad_norm": 0.8564857581354621,
"learning_rate": 3.999420494252116e-05,
"loss": 0.4612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.50236976146698,
"step": 435,
"valid_targets_mean": 2297.1,
"valid_targets_min": 607
},
{
"epoch": 0.7586206896551724,
"grad_norm": 0.8282054432302532,
"learning_rate": 3.9991950638996976e-05,
"loss": 0.4775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4601110816001892,
"step": 440,
"valid_targets_mean": 1987.6,
"valid_targets_min": 510
},
{
"epoch": 0.7672413793103449,
"grad_norm": 2.196261301737067,
"learning_rate": 3.998932688419748e-05,
"loss": 0.4424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40777525305747986,
"step": 445,
"valid_targets_mean": 2384.4,
"valid_targets_min": 537
},
{
"epoch": 0.7758620689655172,
"grad_norm": 0.7767034549725097,
"learning_rate": 3.9986333726609674e-05,
"loss": 0.4409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40235668420791626,
"step": 450,
"valid_targets_mean": 2375.9,
"valid_targets_min": 389
},
{
"epoch": 0.7844827586206896,
"grad_norm": 0.8868383113758573,
"learning_rate": 3.99829712215471e-05,
"loss": 0.4696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4738074839115143,
"step": 455,
"valid_targets_mean": 2075.4,
"valid_targets_min": 613
},
{
"epoch": 0.7931034482758621,
"grad_norm": 0.8653398113931736,
"learning_rate": 3.997923943114886e-05,
"loss": 0.4595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48855382204055786,
"step": 460,
"valid_targets_mean": 3139.3,
"valid_targets_min": 956
},
{
"epoch": 0.8017241379310345,
"grad_norm": 0.683892302463927,
"learning_rate": 3.997513842437845e-05,
"loss": 0.4311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36282363533973694,
"step": 465,
"valid_targets_mean": 2642.1,
"valid_targets_min": 768
},
{
"epoch": 0.8103448275862069,
"grad_norm": 0.9752721796080772,
"learning_rate": 3.997066827702248e-05,
"loss": 0.4858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4777313768863678,
"step": 470,
"valid_targets_mean": 1706.8,
"valid_targets_min": 696
},
{
"epoch": 0.8189655172413793,
"grad_norm": 0.6314778562370668,
"learning_rate": 3.996582907168928e-05,
"loss": 0.5172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4231725335121155,
"step": 475,
"valid_targets_mean": 3065.4,
"valid_targets_min": 769
},
{
"epoch": 0.8275862068965517,
"grad_norm": 0.8832569013931396,
"learning_rate": 3.996062089780737e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3854944705963135,
"step": 480,
"valid_targets_mean": 2018.0,
"valid_targets_min": 904
},
{
"epoch": 0.8362068965517241,
"grad_norm": 0.6652631917767244,
"learning_rate": 3.99550438516238e-05,
"loss": 0.5466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4254167377948761,
"step": 485,
"valid_targets_mean": 3028.4,
"valid_targets_min": 513
},
{
"epoch": 0.8448275862068966,
"grad_norm": 0.7597451955001047,
"learning_rate": 3.994909803620241e-05,
"loss": 0.456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44718462228775024,
"step": 490,
"valid_targets_mean": 2557.1,
"valid_targets_min": 454
},
{
"epoch": 0.853448275862069,
"grad_norm": 0.6578252774007807,
"learning_rate": 3.994278356142187e-05,
"loss": 0.4461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44781360030174255,
"step": 495,
"valid_targets_mean": 2988.4,
"valid_targets_min": 761
},
{
"epoch": 0.8620689655172413,
"grad_norm": 0.7262448958158562,
"learning_rate": 3.993610054397368e-05,
"loss": 0.4587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3711667060852051,
"step": 500,
"valid_targets_mean": 2528.9,
"valid_targets_min": 632
},
{
"epoch": 0.8706896551724138,
"grad_norm": 0.7147220841254082,
"learning_rate": 3.992904910736001e-05,
"loss": 0.4604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.397768497467041,
"step": 505,
"valid_targets_mean": 2382.1,
"valid_targets_min": 600
},
{
"epoch": 0.8793103448275862,
"grad_norm": 0.6122583548543834,
"learning_rate": 3.9921629381891425e-05,
"loss": 0.39,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4616737365722656,
"step": 510,
"valid_targets_mean": 3468.6,
"valid_targets_min": 700
},
{
"epoch": 0.8879310344827587,
"grad_norm": 0.6885272133475613,
"learning_rate": 3.991384150468445e-05,
"loss": 0.4546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.431570440530777,
"step": 515,
"valid_targets_mean": 2822.1,
"valid_targets_min": 414
},
{
"epoch": 0.896551724137931,
"grad_norm": 0.6550575188514011,
"learning_rate": 3.9905685619659074e-05,
"loss": 0.444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3826547861099243,
"step": 520,
"valid_targets_mean": 3025.6,
"valid_targets_min": 527
},
{
"epoch": 0.9051724137931034,
"grad_norm": 0.7376316328489212,
"learning_rate": 3.9897161877536076e-05,
"loss": 0.4599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44813811779022217,
"step": 525,
"valid_targets_mean": 2054.6,
"valid_targets_min": 545
},
{
"epoch": 0.9137931034482759,
"grad_norm": 0.6800801555525916,
"learning_rate": 3.9888270435834196e-05,
"loss": 0.4432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3814975917339325,
"step": 530,
"valid_targets_mean": 2481.4,
"valid_targets_min": 650
},
{
"epoch": 0.9224137931034483,
"grad_norm": 0.678026309874535,
"learning_rate": 3.987901145886731e-05,
"loss": 0.4055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.454716295003891,
"step": 535,
"valid_targets_mean": 3485.5,
"valid_targets_min": 522
},
{
"epoch": 0.9310344827586207,
"grad_norm": 0.733184976085652,
"learning_rate": 3.9869385117741314e-05,
"loss": 0.4626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42944812774658203,
"step": 540,
"valid_targets_mean": 2215.9,
"valid_targets_min": 412
},
{
"epoch": 0.9396551724137931,
"grad_norm": 0.7245253036454354,
"learning_rate": 3.985939159035101e-05,
"loss": 0.3871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40529000759124756,
"step": 545,
"valid_targets_mean": 2216.6,
"valid_targets_min": 441
},
{
"epoch": 0.9482758620689655,
"grad_norm": 0.8082542554339605,
"learning_rate": 3.98490310613768e-05,
"loss": 0.4763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5691283345222473,
"step": 550,
"valid_targets_mean": 2477.1,
"valid_targets_min": 609
},
{
"epoch": 0.9568965517241379,
"grad_norm": 0.6170643339917548,
"learning_rate": 3.983830372228127e-05,
"loss": 0.4762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4863627552986145,
"step": 555,
"valid_targets_mean": 3696.4,
"valid_targets_min": 845
},
{
"epoch": 0.9655172413793104,
"grad_norm": 0.828710236174964,
"learning_rate": 3.982720977130567e-05,
"loss": 0.4584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5036779642105103,
"step": 560,
"valid_targets_mean": 2395.6,
"valid_targets_min": 843
},
{
"epoch": 0.9741379310344828,
"grad_norm": 0.8786478661180452,
"learning_rate": 3.9815749413466204e-05,
"loss": 0.4184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46909040212631226,
"step": 565,
"valid_targets_mean": 1995.8,
"valid_targets_min": 790
},
{
"epoch": 0.9827586206896551,
"grad_norm": 0.7947261832670387,
"learning_rate": 3.980392286055033e-05,
"loss": 0.4518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4978959262371063,
"step": 570,
"valid_targets_mean": 2086.5,
"valid_targets_min": 735
},
{
"epoch": 0.9913793103448276,
"grad_norm": 0.7098014379889231,
"learning_rate": 3.979173033111275e-05,
"loss": 0.3977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4036133289337158,
"step": 575,
"valid_targets_mean": 2342.9,
"valid_targets_min": 792
},
{
"epoch": 1.0,
"grad_norm": 0.6775755166421004,
"learning_rate": 3.977917205047142e-05,
"loss": 0.422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4571645259857178,
"step": 580,
"valid_targets_mean": 2889.3,
"valid_targets_min": 1027
},
{
"epoch": 1.0086206896551724,
"grad_norm": 0.6102387669296445,
"learning_rate": 3.976624825070339e-05,
"loss": 0.3625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29137107729911804,
"step": 585,
"valid_targets_mean": 2821.2,
"valid_targets_min": 624
},
{
"epoch": 1.0172413793103448,
"grad_norm": 0.6197666440180915,
"learning_rate": 3.97529591706405e-05,
"loss": 0.3493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37029892206192017,
"step": 590,
"valid_targets_mean": 2887.8,
"valid_targets_min": 580
},
{
"epoch": 1.0258620689655173,
"grad_norm": 0.8840160427547796,
"learning_rate": 3.973930505586496e-05,
"loss": 0.4321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4517512321472168,
"step": 595,
"valid_targets_mean": 1778.4,
"valid_targets_min": 633
},
{
"epoch": 1.0344827586206897,
"grad_norm": 0.6650314148453361,
"learning_rate": 3.972528615870483e-05,
"loss": 0.3917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3971402645111084,
"step": 600,
"valid_targets_mean": 2811.0,
"valid_targets_min": 747
},
{
"epoch": 1.043103448275862,
"grad_norm": 0.8885280375871449,
"learning_rate": 3.9710902738229354e-05,
"loss": 0.3824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4812260866165161,
"step": 605,
"valid_targets_mean": 1807.2,
"valid_targets_min": 838
},
{
"epoch": 1.0517241379310345,
"grad_norm": 0.8235174714216085,
"learning_rate": 3.9696155060244166e-05,
"loss": 0.4383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.527877688407898,
"step": 610,
"valid_targets_mean": 2185.9,
"valid_targets_min": 907
},
{
"epoch": 1.0603448275862069,
"grad_norm": 0.6243759540097059,
"learning_rate": 3.968104339728636e-05,
"loss": 0.3815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3239450454711914,
"step": 615,
"valid_targets_mean": 2600.6,
"valid_targets_min": 511
},
{
"epoch": 1.0689655172413792,
"grad_norm": 0.8320317076108008,
"learning_rate": 3.966556802861951e-05,
"loss": 0.4487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4784361720085144,
"step": 620,
"valid_targets_mean": 2049.8,
"valid_targets_min": 643
},
{
"epoch": 1.0775862068965518,
"grad_norm": 0.7676936416325113,
"learning_rate": 3.964972924022843e-05,
"loss": 0.4245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45696157217025757,
"step": 625,
"valid_targets_mean": 2586.2,
"valid_targets_min": 798
},
{
"epoch": 1.0862068965517242,
"grad_norm": 0.7315583973749349,
"learning_rate": 3.963352732481396e-05,
"loss": 0.4001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49207547307014465,
"step": 630,
"valid_targets_mean": 2997.6,
"valid_targets_min": 511
},
{
"epoch": 1.0948275862068966,
"grad_norm": 0.6524701307936455,
"learning_rate": 3.961696258178752e-05,
"loss": 0.4073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3828135132789612,
"step": 635,
"valid_targets_mean": 3398.6,
"valid_targets_min": 425
},
{
"epoch": 1.103448275862069,
"grad_norm": 0.6371602051142804,
"learning_rate": 3.960003531726559e-05,
"loss": 0.3559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3406589925289154,
"step": 640,
"valid_targets_mean": 3585.0,
"valid_targets_min": 405
},
{
"epoch": 1.1120689655172413,
"grad_norm": 0.5890368242311975,
"learning_rate": 3.958274584406403e-05,
"loss": 0.4336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33770039677619934,
"step": 645,
"valid_targets_mean": 3216.1,
"valid_targets_min": 709
},
{
"epoch": 1.1206896551724137,
"grad_norm": 0.7050319619089337,
"learning_rate": 3.956509448169233e-05,
"loss": 0.4048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3342927098274231,
"step": 650,
"valid_targets_mean": 2537.4,
"valid_targets_min": 445
},
{
"epoch": 1.1293103448275863,
"grad_norm": 0.7624278995803477,
"learning_rate": 3.9547081556347693e-05,
"loss": 0.3934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42083901166915894,
"step": 655,
"valid_targets_mean": 2359.4,
"valid_targets_min": 607
},
{
"epoch": 1.1379310344827587,
"grad_norm": 0.8322591973207496,
"learning_rate": 3.952870740090901e-05,
"loss": 0.413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29296737909317017,
"step": 660,
"valid_targets_mean": 1606.6,
"valid_targets_min": 538
},
{
"epoch": 1.146551724137931,
"grad_norm": 0.9566943537898349,
"learning_rate": 3.950997235493069e-05,
"loss": 0.3897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3879561722278595,
"step": 665,
"valid_targets_mean": 1809.0,
"valid_targets_min": 675
},
{
"epoch": 1.1551724137931034,
"grad_norm": 0.8626141996861321,
"learning_rate": 3.9490876764636414e-05,
"loss": 0.4095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3392297327518463,
"step": 670,
"valid_targets_mean": 2330.3,
"valid_targets_min": 583
},
{
"epoch": 1.1637931034482758,
"grad_norm": 0.798327566418468,
"learning_rate": 3.947142098291272e-05,
"loss": 0.3831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3780513405799866,
"step": 675,
"valid_targets_mean": 1909.8,
"valid_targets_min": 848
},
{
"epoch": 1.1724137931034484,
"grad_norm": 0.7799978912543006,
"learning_rate": 3.945160536930247e-05,
"loss": 0.3948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38355159759521484,
"step": 680,
"valid_targets_mean": 1956.6,
"valid_targets_min": 462
},
{
"epoch": 1.1810344827586208,
"grad_norm": 0.7170303781637705,
"learning_rate": 3.9431430289998235e-05,
"loss": 0.4309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41659241914749146,
"step": 685,
"valid_targets_mean": 2568.3,
"valid_targets_min": 907
},
{
"epoch": 1.1896551724137931,
"grad_norm": 0.75541871927773,
"learning_rate": 3.941089611783551e-05,
"loss": 0.4384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5742608904838562,
"step": 690,
"valid_targets_mean": 3480.9,
"valid_targets_min": 795
},
{
"epoch": 1.1982758620689655,
"grad_norm": 0.7273236482011581,
"learning_rate": 3.939000323228583e-05,
"loss": 0.3825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3808523416519165,
"step": 695,
"valid_targets_mean": 2336.6,
"valid_targets_min": 828
},
{
"epoch": 1.206896551724138,
"grad_norm": 0.7744304859786367,
"learning_rate": 3.9368752019449744e-05,
"loss": 0.4469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46578434109687805,
"step": 700,
"valid_targets_mean": 2492.6,
"valid_targets_min": 765
},
{
"epoch": 1.2155172413793103,
"grad_norm": 0.6368586747092351,
"learning_rate": 3.934714287204969e-05,
"loss": 0.3956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3132917881011963,
"step": 705,
"valid_targets_mean": 2797.6,
"valid_targets_min": 451
},
{
"epoch": 1.2241379310344827,
"grad_norm": 0.7193926603705026,
"learning_rate": 3.932517618942275e-05,
"loss": 0.4363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49011844396591187,
"step": 710,
"valid_targets_mean": 2756.4,
"valid_targets_min": 549
},
{
"epoch": 1.2327586206896552,
"grad_norm": 0.8222090867667902,
"learning_rate": 3.930285237751324e-05,
"loss": 0.3825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3633798360824585,
"step": 715,
"valid_targets_mean": 2080.2,
"valid_targets_min": 574
},
{
"epoch": 1.2413793103448276,
"grad_norm": 0.6879632039050765,
"learning_rate": 3.928017184886525e-05,
"loss": 0.4158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3634766936302185,
"step": 720,
"valid_targets_mean": 2422.1,
"valid_targets_min": 442
},
{
"epoch": 1.25,
"grad_norm": 0.669091661082806,
"learning_rate": 3.925713502261496e-05,
"loss": 0.3828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4206310510635376,
"step": 725,
"valid_targets_mean": 2847.8,
"valid_targets_min": 661
},
{
"epoch": 1.2586206896551724,
"grad_norm": 0.7599239264639392,
"learning_rate": 3.9233742324482965e-05,
"loss": 0.3671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45150965452194214,
"step": 730,
"valid_targets_mean": 3899.8,
"valid_targets_min": 470
},
{
"epoch": 1.2672413793103448,
"grad_norm": 0.8458728794370647,
"learning_rate": 3.920999418676636e-05,
"loss": 0.4012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3931143879890442,
"step": 735,
"valid_targets_mean": 1709.2,
"valid_targets_min": 735
},
{
"epoch": 1.2758620689655173,
"grad_norm": 0.7894601441756182,
"learning_rate": 3.918589104833075e-05,
"loss": 0.4271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5081537961959839,
"step": 740,
"valid_targets_mean": 2482.3,
"valid_targets_min": 481
},
{
"epoch": 1.2844827586206897,
"grad_norm": 0.8608351924274511,
"learning_rate": 3.916143335460218e-05,
"loss": 0.4317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.375831663608551,
"step": 745,
"valid_targets_mean": 1595.8,
"valid_targets_min": 612
},
{
"epoch": 1.293103448275862,
"grad_norm": 0.6124934646738293,
"learning_rate": 3.913662155755885e-05,
"loss": 0.4397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48569154739379883,
"step": 750,
"valid_targets_mean": 4658.1,
"valid_targets_min": 599
},
{
"epoch": 1.3017241379310345,
"grad_norm": 0.6136863641105471,
"learning_rate": 3.911145611572282e-05,
"loss": 0.4318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40924838185310364,
"step": 755,
"valid_targets_mean": 3167.8,
"valid_targets_min": 626
},
{
"epoch": 1.3103448275862069,
"grad_norm": 0.7193681878175996,
"learning_rate": 3.908593749415148e-05,
"loss": 0.4629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48019519448280334,
"step": 760,
"valid_targets_mean": 2553.4,
"valid_targets_min": 622
},
{
"epoch": 1.3189655172413794,
"grad_norm": 0.6821922155446412,
"learning_rate": 3.9060066164428986e-05,
"loss": 0.3818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4456404745578766,
"step": 765,
"valid_targets_mean": 3264.4,
"valid_targets_min": 599
},
{
"epoch": 1.3275862068965516,
"grad_norm": 0.6012395192250871,
"learning_rate": 3.903384260465756e-05,
"loss": 0.3751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192451596260071,
"step": 770,
"valid_targets_mean": 2788.5,
"valid_targets_min": 868
},
{
"epoch": 1.3362068965517242,
"grad_norm": 0.7545058489849539,
"learning_rate": 3.900726729944861e-05,
"loss": 0.431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47883346676826477,
"step": 775,
"valid_targets_mean": 2500.5,
"valid_targets_min": 612
},
{
"epoch": 1.3448275862068966,
"grad_norm": 0.6398010325865217,
"learning_rate": 3.898034073991382e-05,
"loss": 0.4135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4672417640686035,
"step": 780,
"valid_targets_mean": 3337.8,
"valid_targets_min": 1059
},
{
"epoch": 1.353448275862069,
"grad_norm": 0.7940809550754068,
"learning_rate": 3.8953063423656055e-05,
"loss": 0.424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42937517166137695,
"step": 785,
"valid_targets_mean": 2104.6,
"valid_targets_min": 608
},
{
"epoch": 1.3620689655172413,
"grad_norm": 0.711072268408022,
"learning_rate": 3.892543585476014e-05,
"loss": 0.4081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4857082962989807,
"step": 790,
"valid_targets_mean": 2814.8,
"valid_targets_min": 512
},
{
"epoch": 1.3706896551724137,
"grad_norm": 0.7932387173216984,
"learning_rate": 3.88974585437836e-05,
"loss": 0.4337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5068721175193787,
"step": 795,
"valid_targets_mean": 3371.6,
"valid_targets_min": 519
},
{
"epoch": 1.3793103448275863,
"grad_norm": 0.7379868428248753,
"learning_rate": 3.886913200774717e-05,
"loss": 0.3736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39806318283081055,
"step": 800,
"valid_targets_mean": 2662.9,
"valid_targets_min": 669
},
{
"epoch": 1.3879310344827587,
"grad_norm": 0.9372146576345584,
"learning_rate": 3.884045677012528e-05,
"loss": 0.4324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43995919823646545,
"step": 805,
"valid_targets_mean": 1663.8,
"valid_targets_min": 681
},
{
"epoch": 1.396551724137931,
"grad_norm": 0.757584914847117,
"learning_rate": 3.8811433360836364e-05,
"loss": 0.4064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39269834756851196,
"step": 810,
"valid_targets_mean": 2236.2,
"valid_targets_min": 534
},
{
"epoch": 1.4051724137931034,
"grad_norm": 0.5602666343134688,
"learning_rate": 3.878206231623306e-05,
"loss": 0.4291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34488746523857117,
"step": 815,
"valid_targets_mean": 3282.4,
"valid_targets_min": 485
},
{
"epoch": 1.4137931034482758,
"grad_norm": 0.8360209814458835,
"learning_rate": 3.8752344179092315e-05,
"loss": 0.4534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6250336170196533,
"step": 820,
"valid_targets_mean": 3202.9,
"valid_targets_min": 807
},
{
"epoch": 1.4224137931034484,
"grad_norm": 0.6716355795895128,
"learning_rate": 3.8722279498605344e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34475111961364746,
"step": 825,
"valid_targets_mean": 2427.8,
"valid_targets_min": 412
},
{
"epoch": 1.4310344827586206,
"grad_norm": 0.7510883988029478,
"learning_rate": 3.869186883036748e-05,
"loss": 0.4027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42797213792800903,
"step": 830,
"valid_targets_mean": 2374.5,
"valid_targets_min": 554
},
{
"epoch": 1.4396551724137931,
"grad_norm": 0.7944589287393519,
"learning_rate": 3.8661112736367924e-05,
"loss": 0.4036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38339388370513916,
"step": 835,
"valid_targets_mean": 2018.9,
"valid_targets_min": 590
},
{
"epoch": 1.4482758620689655,
"grad_norm": 0.6465050270956495,
"learning_rate": 3.863001178497933e-05,
"loss": 0.3987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5302772521972656,
"step": 840,
"valid_targets_mean": 4361.5,
"valid_targets_min": 282
},
{
"epoch": 1.456896551724138,
"grad_norm": 0.6893879526286418,
"learning_rate": 3.8598566550947316e-05,
"loss": 0.3881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4017932415008545,
"step": 845,
"valid_targets_mean": 2625.7,
"valid_targets_min": 613
},
{
"epoch": 1.4655172413793103,
"grad_norm": 0.6220088023463586,
"learning_rate": 3.856677761537986e-05,
"loss": 0.4021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36116647720336914,
"step": 850,
"valid_targets_mean": 3468.6,
"valid_targets_min": 715
},
{
"epoch": 1.4741379310344827,
"grad_norm": 0.7694318201664595,
"learning_rate": 3.853464556573652e-05,
"loss": 0.3916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.380726158618927,
"step": 855,
"valid_targets_mean": 2097.6,
"valid_targets_min": 625
},
{
"epoch": 1.4827586206896552,
"grad_norm": 0.7201246052401616,
"learning_rate": 3.850217099581764e-05,
"loss": 0.396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46923041343688965,
"step": 860,
"valid_targets_mean": 2454.4,
"valid_targets_min": 704
},
{
"epoch": 1.4913793103448276,
"grad_norm": 0.7112727683269261,
"learning_rate": 3.8469354505753305e-05,
"loss": 0.3623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3220486044883728,
"step": 865,
"valid_targets_mean": 2655.5,
"valid_targets_min": 510
},
{
"epoch": 1.5,
"grad_norm": 0.6213614398189481,
"learning_rate": 3.843619670199229e-05,
"loss": 0.3986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33441856503486633,
"step": 870,
"valid_targets_mean": 2729.1,
"valid_targets_min": 543
},
{
"epoch": 1.5086206896551724,
"grad_norm": 0.7534771914043414,
"learning_rate": 3.8402698197290865e-05,
"loss": 0.4389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46794092655181885,
"step": 875,
"valid_targets_mean": 3115.1,
"valid_targets_min": 937
},
{
"epoch": 1.5172413793103448,
"grad_norm": 0.6724604582524113,
"learning_rate": 3.8368859610701443e-05,
"loss": 0.4321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5096204280853271,
"step": 880,
"valid_targets_mean": 3365.1,
"valid_targets_min": 703
},
{
"epoch": 1.5258620689655173,
"grad_norm": 0.537324077917551,
"learning_rate": 3.833468156756114e-05,
"loss": 0.3699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39847302436828613,
"step": 885,
"valid_targets_mean": 4028.4,
"valid_targets_min": 352
},
{
"epoch": 1.5344827586206895,
"grad_norm": 0.7701273286666982,
"learning_rate": 3.8300164699480246e-05,
"loss": 0.4074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3641321361064911,
"step": 890,
"valid_targets_mean": 1731.1,
"valid_targets_min": 578
},
{
"epoch": 1.543103448275862,
"grad_norm": 0.6768973576564309,
"learning_rate": 3.8265309644330535e-05,
"loss": 0.3796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40518438816070557,
"step": 895,
"valid_targets_mean": 3067.6,
"valid_targets_min": 653
},
{
"epoch": 1.5517241379310345,
"grad_norm": 0.8375219158955782,
"learning_rate": 3.823011704623347e-05,
"loss": 0.4127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.400987446308136,
"step": 900,
"valid_targets_mean": 1611.2,
"valid_targets_min": 611
},
{
"epoch": 1.5603448275862069,
"grad_norm": 0.8211855004487335,
"learning_rate": 3.81945875555483e-05,
"loss": 0.4045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39641138911247253,
"step": 905,
"valid_targets_mean": 1993.6,
"valid_targets_min": 759
},
{
"epoch": 1.5689655172413794,
"grad_norm": 0.8218745944898366,
"learning_rate": 3.8158721828860094e-05,
"loss": 0.3494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34812313318252563,
"step": 910,
"valid_targets_mean": 1692.9,
"valid_targets_min": 609
},
{
"epoch": 1.5775862068965516,
"grad_norm": 0.7720513032419637,
"learning_rate": 3.81225205289675e-05,
"loss": 0.4902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4618193507194519,
"step": 915,
"valid_targets_mean": 1989.4,
"valid_targets_min": 660
},
{
"epoch": 1.5862068965517242,
"grad_norm": 0.7623625823563448,
"learning_rate": 3.808598432487061e-05,
"loss": 0.4345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36552631855010986,
"step": 920,
"valid_targets_mean": 1844.8,
"valid_targets_min": 555
},
{
"epoch": 1.5948275862068966,
"grad_norm": 0.6438978080095269,
"learning_rate": 3.8049113891758506e-05,
"loss": 0.4502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39778804779052734,
"step": 925,
"valid_targets_mean": 2994.9,
"valid_targets_min": 643
},
{
"epoch": 1.603448275862069,
"grad_norm": 0.7649241814152833,
"learning_rate": 3.8011909910996856e-05,
"loss": 0.3747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43716567754745483,
"step": 930,
"valid_targets_mean": 2140.6,
"valid_targets_min": 607
},
{
"epoch": 1.6120689655172413,
"grad_norm": 0.580587049117197,
"learning_rate": 3.797437307011527e-05,
"loss": 0.378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35338088870048523,
"step": 935,
"valid_targets_mean": 3349.8,
"valid_targets_min": 567
},
{
"epoch": 1.6206896551724137,
"grad_norm": 0.7312067736555172,
"learning_rate": 3.793650406279463e-05,
"loss": 0.4217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40459704399108887,
"step": 940,
"valid_targets_mean": 1908.5,
"valid_targets_min": 664
},
{
"epoch": 1.6293103448275863,
"grad_norm": 0.8452807897938808,
"learning_rate": 3.789830358885423e-05,
"loss": 0.3822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42247670888900757,
"step": 945,
"valid_targets_mean": 1825.6,
"valid_targets_min": 640
},
{
"epoch": 1.6379310344827587,
"grad_norm": 0.6507520907626049,
"learning_rate": 3.7859772354238885e-05,
"loss": 0.3921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28464314341545105,
"step": 950,
"valid_targets_mean": 2569.2,
"valid_targets_min": 569
},
{
"epoch": 1.646551724137931,
"grad_norm": 0.7658684085183802,
"learning_rate": 3.782091107100587e-05,
"loss": 0.4034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4443947970867157,
"step": 955,
"valid_targets_mean": 2170.6,
"valid_targets_min": 814
},
{
"epoch": 1.6551724137931034,
"grad_norm": 1.2494001805866435,
"learning_rate": 3.7781720457311746e-05,
"loss": 0.4166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5146511793136597,
"step": 960,
"valid_targets_mean": 2532.3,
"valid_targets_min": 530
},
{
"epoch": 1.6637931034482758,
"grad_norm": 0.6526502409039252,
"learning_rate": 3.7742201237399105e-05,
"loss": 0.4514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34717223048210144,
"step": 965,
"valid_targets_mean": 3003.6,
"valid_targets_min": 931
},
{
"epoch": 1.6724137931034484,
"grad_norm": 0.633402843925448,
"learning_rate": 3.77023541415832e-05,
"loss": 0.3931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34919875860214233,
"step": 970,
"valid_targets_mean": 2739.6,
"valid_targets_min": 753
},
{
"epoch": 1.6810344827586206,
"grad_norm": 0.8387142971624745,
"learning_rate": 3.7662179906238405e-05,
"loss": 0.4068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40993672609329224,
"step": 975,
"valid_targets_mean": 2246.9,
"valid_targets_min": 708
},
{
"epoch": 1.6896551724137931,
"grad_norm": 0.5085763777226048,
"learning_rate": 3.762167927378464e-05,
"loss": 0.3599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33271750807762146,
"step": 980,
"valid_targets_mean": 4219.9,
"valid_targets_min": 515
},
{
"epoch": 1.6982758620689655,
"grad_norm": 0.8224745860109742,
"learning_rate": 3.7580852992673656e-05,
"loss": 0.392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3762546479701996,
"step": 985,
"valid_targets_mean": 1791.2,
"valid_targets_min": 399
},
{
"epoch": 1.706896551724138,
"grad_norm": 0.5920143777699354,
"learning_rate": 3.7539701817375185e-05,
"loss": 0.3932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3287311792373657,
"step": 990,
"valid_targets_mean": 3017.8,
"valid_targets_min": 572
},
{
"epoch": 1.7155172413793105,
"grad_norm": 0.5939374862414969,
"learning_rate": 3.7498226508362996e-05,
"loss": 0.4305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27790141105651855,
"step": 995,
"valid_targets_mean": 2668.7,
"valid_targets_min": 630
},
{
"epoch": 1.7241379310344827,
"grad_norm": 0.6941009800354047,
"learning_rate": 3.7456427832100864e-05,
"loss": 0.3872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.491094708442688,
"step": 1000,
"valid_targets_mean": 4933.6,
"valid_targets_min": 427
},
{
"epoch": 1.7327586206896552,
"grad_norm": 0.6943581356651782,
"learning_rate": 3.7414306561028385e-05,
"loss": 0.4164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4229108393192291,
"step": 1005,
"valid_targets_mean": 2461.8,
"valid_targets_min": 593
},
{
"epoch": 1.7413793103448276,
"grad_norm": 0.8064131925426529,
"learning_rate": 3.73718634735467e-05,
"loss": 0.4169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45140957832336426,
"step": 1010,
"valid_targets_mean": 2074.4,
"valid_targets_min": 393
},
{
"epoch": 1.75,
"grad_norm": 0.6813330765539505,
"learning_rate": 3.732909935400412e-05,
"loss": 0.3606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3701205253601074,
"step": 1015,
"valid_targets_mean": 3159.4,
"valid_targets_min": 750
},
{
"epoch": 1.7586206896551724,
"grad_norm": 0.6288867610404782,
"learning_rate": 3.7286014992681645e-05,
"loss": 0.3841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3469887375831604,
"step": 1020,
"valid_targets_mean": 2883.7,
"valid_targets_min": 535
},
{
"epoch": 1.7672413793103448,
"grad_norm": 0.7143527167015993,
"learning_rate": 3.7242611185778325e-05,
"loss": 0.3862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39058348536491394,
"step": 1025,
"valid_targets_mean": 3864.4,
"valid_targets_min": 578
},
{
"epoch": 1.7758620689655173,
"grad_norm": 0.5703494416813504,
"learning_rate": 3.7198888735396574e-05,
"loss": 0.4318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.342609703540802,
"step": 1030,
"valid_targets_mean": 3531.6,
"valid_targets_min": 589
},
{
"epoch": 1.7844827586206895,
"grad_norm": 0.6952050006138021,
"learning_rate": 3.7154848449527334e-05,
"loss": 0.3794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4868992567062378,
"step": 1035,
"valid_targets_mean": 2866.4,
"valid_targets_min": 657
},
{
"epoch": 1.793103448275862,
"grad_norm": 0.6282722343659998,
"learning_rate": 3.7110491142035145e-05,
"loss": 0.3694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3678615093231201,
"step": 1040,
"valid_targets_mean": 3136.4,
"valid_targets_min": 524
},
{
"epoch": 1.8017241379310345,
"grad_norm": 0.5812176719759966,
"learning_rate": 3.7065817632643115e-05,
"loss": 0.3729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3459870517253876,
"step": 1045,
"valid_targets_mean": 3125.9,
"valid_targets_min": 664
},
{
"epoch": 1.8103448275862069,
"grad_norm": 0.7052883776391125,
"learning_rate": 3.702082874691776e-05,
"loss": 0.3779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3673224449157715,
"step": 1050,
"valid_targets_mean": 2189.1,
"valid_targets_min": 879
},
{
"epoch": 1.8189655172413794,
"grad_norm": 0.6973382773007308,
"learning_rate": 3.6975525316253744e-05,
"loss": 0.4054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34974607825279236,
"step": 1055,
"valid_targets_mean": 2217.2,
"valid_targets_min": 741
},
{
"epoch": 1.8275862068965516,
"grad_norm": 0.7266969496321424,
"learning_rate": 3.692990817785853e-05,
"loss": 0.3681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42130789160728455,
"step": 1060,
"valid_targets_mean": 2347.6,
"valid_targets_min": 583
},
{
"epoch": 1.8362068965517242,
"grad_norm": 0.8676321505533798,
"learning_rate": 3.68839781747369e-05,
"loss": 0.3863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45284566283226013,
"step": 1065,
"valid_targets_mean": 1771.2,
"valid_targets_min": 617
},
{
"epoch": 1.8448275862068966,
"grad_norm": 0.6589301963607709,
"learning_rate": 3.683773615567538e-05,
"loss": 0.3954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3539057970046997,
"step": 1070,
"valid_targets_mean": 2677.9,
"valid_targets_min": 558
},
{
"epoch": 1.853448275862069,
"grad_norm": 0.6167457014344452,
"learning_rate": 3.679118297522654e-05,
"loss": 0.4454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4817582666873932,
"step": 1075,
"valid_targets_mean": 4339.6,
"valid_targets_min": 377
},
{
"epoch": 1.8620689655172413,
"grad_norm": 0.6055737080045898,
"learning_rate": 3.674431949369321e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.393863320350647,
"step": 1080,
"valid_targets_mean": 3241.9,
"valid_targets_min": 492
},
{
"epoch": 1.8706896551724137,
"grad_norm": 0.7354615943580206,
"learning_rate": 3.6697146577112614e-05,
"loss": 0.3936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38788315653800964,
"step": 1085,
"valid_targets_mean": 2015.6,
"valid_targets_min": 431
},
{
"epoch": 1.8793103448275863,
"grad_norm": 0.5760016126037003,
"learning_rate": 3.6649665097240304e-05,
"loss": 0.3942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40716418623924255,
"step": 1090,
"valid_targets_mean": 4327.3,
"valid_targets_min": 551
},
{
"epoch": 1.8879310344827587,
"grad_norm": 0.8615793077201944,
"learning_rate": 3.660187593153408e-05,
"loss": 0.3816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43805018067359924,
"step": 1095,
"valid_targets_mean": 1688.0,
"valid_targets_min": 656
},
{
"epoch": 1.896551724137931,
"grad_norm": 0.7457791465766714,
"learning_rate": 3.655377996313782e-05,
"loss": 0.4069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4772360324859619,
"step": 1100,
"valid_targets_mean": 2212.9,
"valid_targets_min": 575
},
{
"epoch": 1.9051724137931034,
"grad_norm": 0.8291844822006753,
"learning_rate": 3.6505378080865054e-05,
"loss": 0.4113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39961403608322144,
"step": 1105,
"valid_targets_mean": 1644.9,
"valid_targets_min": 479
},
{
"epoch": 1.9137931034482758,
"grad_norm": 0.6199256600700211,
"learning_rate": 3.645667117918265e-05,
"loss": 0.4192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3381462097167969,
"step": 1110,
"valid_targets_mean": 2744.1,
"valid_targets_min": 645
},
{
"epoch": 1.9224137931034484,
"grad_norm": 0.5746653636562877,
"learning_rate": 3.640766015819423e-05,
"loss": 0.4441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.423374205827713,
"step": 1115,
"valid_targets_mean": 3882.1,
"valid_targets_min": 818
},
{
"epoch": 1.9310344827586206,
"grad_norm": 0.6329881260544258,
"learning_rate": 3.6358345923623506e-05,
"loss": 0.3768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3031822443008423,
"step": 1120,
"valid_targets_mean": 2636.6,
"valid_targets_min": 560
},
{
"epoch": 1.9396551724137931,
"grad_norm": 0.6746260613469616,
"learning_rate": 3.630872938679761e-05,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3765380382537842,
"step": 1125,
"valid_targets_mean": 2744.8,
"valid_targets_min": 686
},
{
"epoch": 1.9482758620689655,
"grad_norm": 0.740987702919496,
"learning_rate": 3.6258811464630215e-05,
"loss": 0.4098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42373108863830566,
"step": 1130,
"valid_targets_mean": 2425.2,
"valid_targets_min": 432
},
{
"epoch": 1.956896551724138,
"grad_norm": 1.1924553665440873,
"learning_rate": 3.620859307960458e-05,
"loss": 0.4763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3285548686981201,
"step": 1135,
"valid_targets_mean": 2777.8,
"valid_targets_min": 606
},
{
"epoch": 1.9655172413793105,
"grad_norm": 0.8258503182816348,
"learning_rate": 3.615807515975654e-05,
"loss": 0.3811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43213579058647156,
"step": 1140,
"valid_targets_mean": 2270.6,
"valid_targets_min": 535
},
{
"epoch": 1.9741379310344827,
"grad_norm": 0.6833220821483821,
"learning_rate": 3.6107258638657324e-05,
"loss": 0.3751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3122459948062897,
"step": 1145,
"valid_targets_mean": 4119.2,
"valid_targets_min": 731
},
{
"epoch": 1.9827586206896552,
"grad_norm": 0.5830920412565893,
"learning_rate": 3.60561444553963e-05,
"loss": 0.4329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3681791424751282,
"step": 1150,
"valid_targets_mean": 3160.9,
"valid_targets_min": 961
},
{
"epoch": 1.9913793103448276,
"grad_norm": 0.6162725013998724,
"learning_rate": 3.600473355456366e-05,
"loss": 0.3904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34768128395080566,
"step": 1155,
"valid_targets_mean": 3020.3,
"valid_targets_min": 637
},
{
"epoch": 2.0,
"grad_norm": 0.7220829440099563,
"learning_rate": 3.595302688623291e-05,
"loss": 0.365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4216357171535492,
"step": 1160,
"valid_targets_mean": 2232.6,
"valid_targets_min": 503
},
{
"epoch": 2.0086206896551726,
"grad_norm": 0.5388192966250313,
"learning_rate": 3.590102540594337e-05,
"loss": 0.3466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30984219908714294,
"step": 1165,
"valid_targets_mean": 3784.2,
"valid_targets_min": 435
},
{
"epoch": 2.0172413793103448,
"grad_norm": 0.8860377930426859,
"learning_rate": 3.584873007468244e-05,
"loss": 0.3232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3425954580307007,
"step": 1170,
"valid_targets_mean": 1921.7,
"valid_targets_min": 736
},
{
"epoch": 2.0258620689655173,
"grad_norm": 0.8903193161432715,
"learning_rate": 3.5796141858867935e-05,
"loss": 0.3589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3836989998817444,
"step": 1175,
"valid_targets_mean": 1732.9,
"valid_targets_min": 635
},
{
"epoch": 2.0344827586206895,
"grad_norm": 0.6655554260518024,
"learning_rate": 3.5743261730330144e-05,
"loss": 0.3388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3734143376350403,
"step": 1180,
"valid_targets_mean": 3244.6,
"valid_targets_min": 1242
},
{
"epoch": 2.043103448275862,
"grad_norm": 0.6589382550025945,
"learning_rate": 3.569009066629392e-05,
"loss": 0.3406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3362818956375122,
"step": 1185,
"valid_targets_mean": 3155.6,
"valid_targets_min": 839
},
{
"epoch": 2.0517241379310347,
"grad_norm": 0.6918050697024621,
"learning_rate": 3.56366296493606e-05,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3342352509498596,
"step": 1190,
"valid_targets_mean": 2828.1,
"valid_targets_min": 589
},
{
"epoch": 2.060344827586207,
"grad_norm": 0.5940371066958855,
"learning_rate": 3.558287966748985e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2669927477836609,
"step": 1195,
"valid_targets_mean": 3061.4,
"valid_targets_min": 690
},
{
"epoch": 2.0689655172413794,
"grad_norm": 0.7643289898339554,
"learning_rate": 3.552884171398141e-05,
"loss": 0.3567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4045037031173706,
"step": 1200,
"valid_targets_mean": 2579.3,
"valid_targets_min": 535
},
{
"epoch": 2.0775862068965516,
"grad_norm": 0.7255326164964023,
"learning_rate": 3.547451678745673e-05,
"loss": 0.3679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39175868034362793,
"step": 1205,
"valid_targets_mean": 2542.5,
"valid_targets_min": 758
},
{
"epoch": 2.086206896551724,
"grad_norm": 0.6060718767054583,
"learning_rate": 3.541990589184053e-05,
"loss": 0.3874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4336078464984894,
"step": 1210,
"valid_targets_mean": 3638.5,
"valid_targets_min": 610
},
{
"epoch": 2.0948275862068964,
"grad_norm": 0.6766990332271949,
"learning_rate": 3.5365010036342245e-05,
"loss": 0.3094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32076266407966614,
"step": 1215,
"valid_targets_mean": 2834.5,
"valid_targets_min": 514
},
{
"epoch": 2.103448275862069,
"grad_norm": 0.5734779038893596,
"learning_rate": 3.530983023543734e-05,
"loss": 0.344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31001657247543335,
"step": 1220,
"valid_targets_mean": 3574.9,
"valid_targets_min": 901
},
{
"epoch": 2.1120689655172415,
"grad_norm": 0.7199219118404978,
"learning_rate": 3.525436750884863e-05,
"loss": 0.3505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31847256422042847,
"step": 1225,
"valid_targets_mean": 2214.8,
"valid_targets_min": 616
},
{
"epoch": 2.1206896551724137,
"grad_norm": 0.6319108730231816,
"learning_rate": 3.5198622881527374e-05,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28605881333351135,
"step": 1230,
"valid_targets_mean": 3245.0,
"valid_targets_min": 652
},
{
"epoch": 2.1293103448275863,
"grad_norm": 0.7995321706961999,
"learning_rate": 3.514259738363436e-05,
"loss": 0.3408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3353400230407715,
"step": 1235,
"valid_targets_mean": 2027.1,
"valid_targets_min": 820
},
{
"epoch": 2.1379310344827585,
"grad_norm": 0.9179748361646247,
"learning_rate": 3.5086292050520855e-05,
"loss": 0.3613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39520493149757385,
"step": 1240,
"valid_targets_mean": 1937.8,
"valid_targets_min": 395
},
{
"epoch": 2.146551724137931,
"grad_norm": 0.746855498744147,
"learning_rate": 3.502970792270951e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3741573393344879,
"step": 1245,
"valid_targets_mean": 2679.6,
"valid_targets_min": 692
},
{
"epoch": 2.1551724137931036,
"grad_norm": 0.5754114961452039,
"learning_rate": 3.497284604587508e-05,
"loss": 0.356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3210458755493164,
"step": 1250,
"valid_targets_mean": 3502.5,
"valid_targets_min": 621
},
{
"epoch": 2.163793103448276,
"grad_norm": 0.7426374111463406,
"learning_rate": 3.491570747082512e-05,
"loss": 0.2985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2950843274593353,
"step": 1255,
"valid_targets_mean": 2185.5,
"valid_targets_min": 748
},
{
"epoch": 2.1724137931034484,
"grad_norm": 1.8569462813349802,
"learning_rate": 3.485829325348059e-05,
"loss": 0.3621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4585845470428467,
"step": 1260,
"valid_targets_mean": 2958.1,
"valid_targets_min": 531
},
{
"epoch": 2.1810344827586206,
"grad_norm": 0.6461462169152513,
"learning_rate": 3.4800604454856284e-05,
"loss": 0.3506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35911306738853455,
"step": 1265,
"valid_targets_mean": 2807.1,
"valid_targets_min": 640
},
{
"epoch": 2.189655172413793,
"grad_norm": 0.8080624401623676,
"learning_rate": 3.47426421410413e-05,
"loss": 0.3751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31265851855278015,
"step": 1270,
"valid_targets_mean": 2058.2,
"valid_targets_min": 848
},
{
"epoch": 2.1982758620689653,
"grad_norm": 0.6467103643654887,
"learning_rate": 3.468440738317926e-05,
"loss": 0.3612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3470854163169861,
"step": 1275,
"valid_targets_mean": 3573.7,
"valid_targets_min": 957
},
{
"epoch": 2.206896551724138,
"grad_norm": 0.7060195928575449,
"learning_rate": 3.4625901257448596e-05,
"loss": 0.3481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3791043758392334,
"step": 1280,
"valid_targets_mean": 2588.9,
"valid_targets_min": 690
},
{
"epoch": 2.2155172413793105,
"grad_norm": 0.8796348183577576,
"learning_rate": 3.4567124845042564e-05,
"loss": 0.2697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27518510818481445,
"step": 1285,
"valid_targets_mean": 1862.4,
"valid_targets_min": 424
},
{
"epoch": 2.2241379310344827,
"grad_norm": 0.9628728050045314,
"learning_rate": 3.4508079232149354e-05,
"loss": 0.3545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4080553352832794,
"step": 1290,
"valid_targets_mean": 1559.8,
"valid_targets_min": 551
},
{
"epoch": 2.2327586206896552,
"grad_norm": 0.7472287967147371,
"learning_rate": 3.444876550993198e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33648034930229187,
"step": 1295,
"valid_targets_mean": 2121.4,
"valid_targets_min": 560
},
{
"epoch": 2.2413793103448274,
"grad_norm": 0.5763763906754586,
"learning_rate": 3.4389184774508105e-05,
"loss": 0.3693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3669682741165161,
"step": 1300,
"valid_targets_mean": 3822.4,
"valid_targets_min": 908
},
{
"epoch": 2.25,
"grad_norm": 0.8021437893371579,
"learning_rate": 3.43293381269298e-05,
"loss": 0.3623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3201998174190521,
"step": 1305,
"valid_targets_mean": 2141.8,
"valid_targets_min": 569
},
{
"epoch": 2.2586206896551726,
"grad_norm": 0.7305450212853413,
"learning_rate": 3.4269226673163204e-05,
"loss": 0.381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47764334082603455,
"step": 1310,
"valid_targets_mean": 3005.6,
"valid_targets_min": 579
},
{
"epoch": 2.2672413793103448,
"grad_norm": 0.8083273631520955,
"learning_rate": 3.420885152406805e-05,
"loss": 0.3438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3901101052761078,
"step": 1315,
"valid_targets_mean": 2275.4,
"valid_targets_min": 506
},
{
"epoch": 2.2758620689655173,
"grad_norm": 0.8109990424140212,
"learning_rate": 3.4148213795377194e-05,
"loss": 0.3724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37412458658218384,
"step": 1320,
"valid_targets_mean": 2063.2,
"valid_targets_min": 488
},
{
"epoch": 2.2844827586206895,
"grad_norm": 0.7476899330396594,
"learning_rate": 3.408731460767593e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29301315546035767,
"step": 1325,
"valid_targets_mean": 2032.8,
"valid_targets_min": 477
},
{
"epoch": 2.293103448275862,
"grad_norm": 0.7384812273892642,
"learning_rate": 3.402615508638134e-05,
"loss": 0.3668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4986970126628876,
"step": 1330,
"valid_targets_mean": 2887.1,
"valid_targets_min": 1171
},
{
"epoch": 2.3017241379310347,
"grad_norm": 0.7052675589889301,
"learning_rate": 3.396473636172146e-05,
"loss": 0.3765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3002275824546814,
"step": 1335,
"valid_targets_mean": 2545.4,
"valid_targets_min": 543
},
{
"epoch": 2.310344827586207,
"grad_norm": 0.5638329722524688,
"learning_rate": 3.3903059568714406e-05,
"loss": 0.3458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29387524724006653,
"step": 1340,
"valid_targets_mean": 3717.7,
"valid_targets_min": 569
},
{
"epoch": 2.3189655172413794,
"grad_norm": 0.7437822158482291,
"learning_rate": 3.384112584714739e-05,
"loss": 0.3588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3086732029914856,
"step": 1345,
"valid_targets_mean": 2345.1,
"valid_targets_min": 493
},
{
"epoch": 2.3275862068965516,
"grad_norm": 0.7665275506599184,
"learning_rate": 3.377893634155568e-05,
"loss": 0.3104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3466002345085144,
"step": 1350,
"valid_targets_mean": 2198.2,
"valid_targets_min": 950
},
{
"epoch": 2.336206896551724,
"grad_norm": 0.6885948848323417,
"learning_rate": 3.371649220120143e-05,
"loss": 0.329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33025288581848145,
"step": 1355,
"valid_targets_mean": 2540.4,
"valid_targets_min": 575
},
{
"epoch": 2.344827586206897,
"grad_norm": 0.6702991821826371,
"learning_rate": 3.365379458005243e-05,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3554913103580475,
"step": 1360,
"valid_targets_mean": 3490.3,
"valid_targets_min": 522
},
{
"epoch": 2.353448275862069,
"grad_norm": 0.7820230821530418,
"learning_rate": 3.35908446367608e-05,
"loss": 0.3438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3224671185016632,
"step": 1365,
"valid_targets_mean": 2158.5,
"valid_targets_min": 905
},
{
"epoch": 2.3620689655172415,
"grad_norm": 0.5499398168119826,
"learning_rate": 3.35276435346416e-05,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3069545030593872,
"step": 1370,
"valid_targets_mean": 3997.6,
"valid_targets_min": 718
},
{
"epoch": 2.3706896551724137,
"grad_norm": 0.6187347278761689,
"learning_rate": 3.346419244165127e-05,
"loss": 0.3362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29844409227371216,
"step": 1375,
"valid_targets_mean": 3237.6,
"valid_targets_min": 549
},
{
"epoch": 2.3793103448275863,
"grad_norm": 0.7649535914549306,
"learning_rate": 3.3400492530366086e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3073192834854126,
"step": 1380,
"valid_targets_mean": 2159.3,
"valid_targets_min": 932
},
{
"epoch": 2.3879310344827585,
"grad_norm": 0.8065445997332823,
"learning_rate": 3.333654497796051e-05,
"loss": 0.4314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4503655433654785,
"step": 1385,
"valid_targets_mean": 2368.5,
"valid_targets_min": 479
},
{
"epoch": 2.396551724137931,
"grad_norm": 0.9539292555942607,
"learning_rate": 3.32723509661854e-05,
"loss": 0.3426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35420340299606323,
"step": 1390,
"valid_targets_mean": 1735.4,
"valid_targets_min": 544
},
{
"epoch": 2.405172413793103,
"grad_norm": 0.7435624854998906,
"learning_rate": 3.320791168134617e-05,
"loss": 0.3141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2867245078086853,
"step": 1395,
"valid_targets_mean": 2049.0,
"valid_targets_min": 605
},
{
"epoch": 2.413793103448276,
"grad_norm": 0.8410354465466265,
"learning_rate": 3.31432283142809e-05,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4442535638809204,
"step": 1400,
"valid_targets_mean": 2262.7,
"valid_targets_min": 729
},
{
"epoch": 2.4224137931034484,
"grad_norm": 0.6903927781580114,
"learning_rate": 3.307830206033831e-05,
"loss": 0.3538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3711048364639282,
"step": 1405,
"valid_targets_mean": 3179.2,
"valid_targets_min": 882
},
{
"epoch": 2.4310344827586206,
"grad_norm": 0.695084735647335,
"learning_rate": 3.301313411935565e-05,
"loss": 0.3563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3399720788002014,
"step": 1410,
"valid_targets_mean": 2799.4,
"valid_targets_min": 450
},
{
"epoch": 2.439655172413793,
"grad_norm": 0.7060158875096876,
"learning_rate": 3.294772569563656e-05,
"loss": 0.4188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4565882086753845,
"step": 1415,
"valid_targets_mean": 3125.3,
"valid_targets_min": 871
},
{
"epoch": 2.4482758620689653,
"grad_norm": 0.6993437246470752,
"learning_rate": 3.28820779979288e-05,
"loss": 0.3751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3832154870033264,
"step": 1420,
"valid_targets_mean": 3026.6,
"valid_targets_min": 798
},
{
"epoch": 2.456896551724138,
"grad_norm": 0.7671380866195133,
"learning_rate": 3.281619223940192e-05,
"loss": 0.3543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39568156003952026,
"step": 1425,
"valid_targets_mean": 3380.5,
"valid_targets_min": 409
},
{
"epoch": 2.4655172413793105,
"grad_norm": 0.883160039143343,
"learning_rate": 3.2750069637624826e-05,
"loss": 0.3663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4419388771057129,
"step": 1430,
"valid_targets_mean": 1897.9,
"valid_targets_min": 712
},
{
"epoch": 2.4741379310344827,
"grad_norm": 0.7456455502612334,
"learning_rate": 3.2683711414543295e-05,
"loss": 0.3458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38482749462127686,
"step": 1435,
"valid_targets_mean": 2422.2,
"valid_targets_min": 774
},
{
"epoch": 2.4827586206896552,
"grad_norm": 0.6311742479799494,
"learning_rate": 3.261711879645737e-05,
"loss": 0.3602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3681245744228363,
"step": 1440,
"valid_targets_mean": 3291.8,
"valid_targets_min": 431
},
{
"epoch": 2.4913793103448274,
"grad_norm": 0.9504806362945273,
"learning_rate": 3.255029301399873e-05,
"loss": 0.3541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3798632025718689,
"step": 1445,
"valid_targets_mean": 1594.6,
"valid_targets_min": 665
},
{
"epoch": 2.5,
"grad_norm": 0.8003715063056267,
"learning_rate": 3.248323530210793e-05,
"loss": 0.3567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36555957794189453,
"step": 1450,
"valid_targets_mean": 1955.6,
"valid_targets_min": 674
},
{
"epoch": 2.5086206896551726,
"grad_norm": 0.7228548026264292,
"learning_rate": 3.241594690001157e-05,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3639114499092102,
"step": 1455,
"valid_targets_mean": 2435.6,
"valid_targets_min": 798
},
{
"epoch": 2.5172413793103448,
"grad_norm": 0.7739840718205107,
"learning_rate": 3.2348429051199424e-05,
"loss": 0.3409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35158008337020874,
"step": 1460,
"valid_targets_mean": 2565.8,
"valid_targets_min": 571
},
{
"epoch": 2.5258620689655173,
"grad_norm": 0.6029145997859495,
"learning_rate": 3.228068300340142e-05,
"loss": 0.3638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2789810299873352,
"step": 1465,
"valid_targets_mean": 3232.9,
"valid_targets_min": 706
},
{
"epoch": 2.5344827586206895,
"grad_norm": 0.6812715584245135,
"learning_rate": 3.221271000856462e-05,
"loss": 0.3229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30192792415618896,
"step": 1470,
"valid_targets_mean": 2195.8,
"valid_targets_min": 534
},
{
"epoch": 2.543103448275862,
"grad_norm": 0.6507849147630267,
"learning_rate": 3.214451132283006e-05,
"loss": 0.3808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3988229036331177,
"step": 1475,
"valid_targets_mean": 3180.1,
"valid_targets_min": 721
},
{
"epoch": 2.5517241379310347,
"grad_norm": 0.6225641239120543,
"learning_rate": 3.207608820650955e-05,
"loss": 0.3579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2806398868560791,
"step": 1480,
"valid_targets_mean": 2902.6,
"valid_targets_min": 583
},
{
"epoch": 2.560344827586207,
"grad_norm": 0.7164560899643635,
"learning_rate": 3.2007441924062374e-05,
"loss": 0.3216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3189341425895691,
"step": 1485,
"valid_targets_mean": 2501.9,
"valid_targets_min": 528
},
{
"epoch": 2.5689655172413794,
"grad_norm": 1.1127820484519313,
"learning_rate": 3.193857374407192e-05,
"loss": 0.3498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3648238480091095,
"step": 1490,
"valid_targets_mean": 2207.4,
"valid_targets_min": 703
},
{
"epoch": 2.5775862068965516,
"grad_norm": 0.6715513908381312,
"learning_rate": 3.186948493922225e-05,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3119972050189972,
"step": 1495,
"valid_targets_mean": 2720.2,
"valid_targets_min": 993
},
{
"epoch": 2.586206896551724,
"grad_norm": 0.7059911737426282,
"learning_rate": 3.180017678627458e-05,
"loss": 0.3531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30181488394737244,
"step": 1500,
"valid_targets_mean": 2658.7,
"valid_targets_min": 595
},
{
"epoch": 2.594827586206897,
"grad_norm": 0.6789907795293526,
"learning_rate": 3.173065056604366e-05,
"loss": 0.3533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32512885332107544,
"step": 1505,
"valid_targets_mean": 2610.2,
"valid_targets_min": 681
},
{
"epoch": 2.603448275862069,
"grad_norm": 0.7487712135796768,
"learning_rate": 3.166090756337415e-05,
"loss": 0.3767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37083733081817627,
"step": 1510,
"valid_targets_mean": 2299.0,
"valid_targets_min": 604
},
{
"epoch": 2.612068965517241,
"grad_norm": 0.7645675510189072,
"learning_rate": 3.159094906711683e-05,
"loss": 0.3825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42760002613067627,
"step": 1515,
"valid_targets_mean": 2592.6,
"valid_targets_min": 898
},
{
"epoch": 2.6206896551724137,
"grad_norm": 0.9936249106784035,
"learning_rate": 3.15207763701048e-05,
"loss": 0.3609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4002576172351837,
"step": 1520,
"valid_targets_mean": 1749.7,
"valid_targets_min": 642
},
{
"epoch": 2.6293103448275863,
"grad_norm": 0.8230639044983854,
"learning_rate": 3.14503907691296e-05,
"loss": 0.3642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38861727714538574,
"step": 1525,
"valid_targets_mean": 2186.8,
"valid_targets_min": 507
},
{
"epoch": 2.637931034482759,
"grad_norm": 0.8025375712809919,
"learning_rate": 3.1379793564917235e-05,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3810392916202545,
"step": 1530,
"valid_targets_mean": 2889.3,
"valid_targets_min": 643
},
{
"epoch": 2.646551724137931,
"grad_norm": 0.5988230969931015,
"learning_rate": 3.130898606210414e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2393997609615326,
"step": 1535,
"valid_targets_mean": 3076.1,
"valid_targets_min": 462
},
{
"epoch": 2.655172413793103,
"grad_norm": 0.728559481458037,
"learning_rate": 3.1237969569213056e-05,
"loss": 0.3493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38803786039352417,
"step": 1540,
"valid_targets_mean": 3300.9,
"valid_targets_min": 463
},
{
"epoch": 2.663793103448276,
"grad_norm": 0.7872815008631463,
"learning_rate": 3.1166745398628874e-05,
"loss": 0.3395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38372093439102173,
"step": 1545,
"valid_targets_mean": 2159.7,
"valid_targets_min": 597
},
{
"epoch": 2.6724137931034484,
"grad_norm": 0.7072698084992165,
"learning_rate": 3.109531486657437e-05,
"loss": 0.3165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29802533984184265,
"step": 1550,
"valid_targets_mean": 2321.8,
"valid_targets_min": 1013
},
{
"epoch": 2.6810344827586206,
"grad_norm": 0.7613110972073325,
"learning_rate": 3.102367929308586e-05,
"loss": 0.3994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3502175211906433,
"step": 1555,
"valid_targets_mean": 2251.6,
"valid_targets_min": 661
},
{
"epoch": 2.689655172413793,
"grad_norm": 0.6782266299730657,
"learning_rate": 3.0951840001988854e-05,
"loss": 0.3133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3079949915409088,
"step": 1560,
"valid_targets_mean": 2867.9,
"valid_targets_min": 461
},
{
"epoch": 2.6982758620689653,
"grad_norm": 0.7261807462216028,
"learning_rate": 3.0879798320873546e-05,
"loss": 0.4048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2996377646923065,
"step": 1565,
"valid_targets_mean": 2151.3,
"valid_targets_min": 495
},
{
"epoch": 2.706896551724138,
"grad_norm": 0.6937031125933657,
"learning_rate": 3.0807555581070304e-05,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25993096828460693,
"step": 1570,
"valid_targets_mean": 2490.8,
"valid_targets_min": 539
},
{
"epoch": 2.7155172413793105,
"grad_norm": 0.7786261011913469,
"learning_rate": 3.0735113117625045e-05,
"loss": 0.3513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3422274589538574,
"step": 1575,
"valid_targets_mean": 2306.8,
"valid_targets_min": 687
},
{
"epoch": 2.7241379310344827,
"grad_norm": 0.7305876707441854,
"learning_rate": 3.0662472269274617e-05,
"loss": 0.3359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31524696946144104,
"step": 1580,
"valid_targets_mean": 2317.8,
"valid_targets_min": 825
},
{
"epoch": 2.7327586206896552,
"grad_norm": 0.5716678765427254,
"learning_rate": 3.058963437842198e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28373339772224426,
"step": 1585,
"valid_targets_mean": 3168.1,
"valid_targets_min": 623
},
{
"epoch": 2.7413793103448274,
"grad_norm": 0.7402945538942874,
"learning_rate": 3.0516600791111465e-05,
"loss": 0.3303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28591129183769226,
"step": 1590,
"valid_targets_mean": 1927.6,
"valid_targets_min": 670
},
{
"epoch": 2.75,
"grad_norm": 0.7215101466312314,
"learning_rate": 3.0443372857003857e-05,
"loss": 0.3378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37307700514793396,
"step": 1595,
"valid_targets_mean": 2697.4,
"valid_targets_min": 810
},
{
"epoch": 2.7586206896551726,
"grad_norm": 0.7518556001114719,
"learning_rate": 3.036995192935149e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46996602416038513,
"step": 1600,
"valid_targets_mean": 3145.1,
"valid_targets_min": 559
},
{
"epoch": 2.7672413793103448,
"grad_norm": 0.6659069040257636,
"learning_rate": 3.029633936497321e-05,
"loss": 0.4064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3989485502243042,
"step": 1605,
"valid_targets_mean": 3162.9,
"valid_targets_min": 954
},
{
"epoch": 2.7758620689655173,
"grad_norm": 0.6831300245308447,
"learning_rate": 3.0222536524229293e-05,
"loss": 0.3488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3316096067428589,
"step": 1610,
"valid_targets_mean": 2702.7,
"valid_targets_min": 667
},
{
"epoch": 2.7844827586206895,
"grad_norm": 0.800951974974391,
"learning_rate": 3.0148544770996343e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3438343405723572,
"step": 1615,
"valid_targets_mean": 2641.6,
"valid_targets_min": 868
},
{
"epoch": 2.793103448275862,
"grad_norm": 0.7425261001470722,
"learning_rate": 3.007436547264207e-05,
"loss": 0.3785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.453504741191864,
"step": 1620,
"valid_targets_mean": 2584.2,
"valid_targets_min": 525
},
{
"epoch": 2.8017241379310347,
"grad_norm": 0.5879356651252614,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.3625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33316174149513245,
"step": 1625,
"valid_targets_mean": 4065.9,
"valid_targets_min": 920
},
{
"epoch": 2.810344827586207,
"grad_norm": 0.706718695443324,
"learning_rate": 2.9925449727344184e-05,
"loss": 0.3809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2795742154121399,
"step": 1630,
"valid_targets_mean": 2615.4,
"valid_targets_min": 561
},
{
"epoch": 2.8189655172413794,
"grad_norm": 0.7529444243081488,
"learning_rate": 2.985071603236374e-05,
"loss": 0.3375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4043508768081665,
"step": 1635,
"valid_targets_mean": 2506.1,
"valid_targets_min": 414
},
{
"epoch": 2.8275862068965516,
"grad_norm": 0.8478343119280666,
"learning_rate": 2.9775800296137474e-05,
"loss": 0.3783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4446679353713989,
"step": 1640,
"valid_targets_mean": 1810.9,
"valid_targets_min": 498
},
{
"epoch": 2.836206896551724,
"grad_norm": 0.7560518629172477,
"learning_rate": 2.970070390310828e-05,
"loss": 0.3573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3898079991340637,
"step": 1645,
"valid_targets_mean": 2541.4,
"valid_targets_min": 519
},
{
"epoch": 2.844827586206897,
"grad_norm": 0.8856301975925097,
"learning_rate": 2.962542824105762e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33871254324913025,
"step": 1650,
"valid_targets_mean": 1665.4,
"valid_targets_min": 709
},
{
"epoch": 2.853448275862069,
"grad_norm": 0.6294418184869306,
"learning_rate": 2.954997470107982e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3157624304294586,
"step": 1655,
"valid_targets_mean": 3095.0,
"valid_targets_min": 687
},
{
"epoch": 2.862068965517241,
"grad_norm": 0.8204032206897608,
"learning_rate": 2.947434467755641e-05,
"loss": 0.3209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3293578624725342,
"step": 1660,
"valid_targets_mean": 1745.1,
"valid_targets_min": 722
},
{
"epoch": 2.8706896551724137,
"grad_norm": 0.6456585958148404,
"learning_rate": 2.9398539568130327e-05,
"loss": 0.3683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4245327115058899,
"step": 1665,
"valid_targets_mean": 3494.4,
"valid_targets_min": 691
},
{
"epoch": 2.8793103448275863,
"grad_norm": 0.8505733892277261,
"learning_rate": 2.9322560773680087e-05,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35134515166282654,
"step": 1670,
"valid_targets_mean": 2579.3,
"valid_targets_min": 1001
},
{
"epoch": 2.887931034482759,
"grad_norm": 0.5659331350418874,
"learning_rate": 2.924640969829393e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2454695701599121,
"step": 1675,
"valid_targets_mean": 3142.8,
"valid_targets_min": 485
},
{
"epoch": 2.896551724137931,
"grad_norm": 0.8263610710384296,
"learning_rate": 2.9170087749243832e-05,
"loss": 0.3428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35583004355430603,
"step": 1680,
"valid_targets_mean": 2292.0,
"valid_targets_min": 772
},
{
"epoch": 2.905172413793103,
"grad_norm": 0.7317330072322265,
"learning_rate": 2.9093596336959513e-05,
"loss": 0.3961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42089030146598816,
"step": 1685,
"valid_targets_mean": 3087.1,
"valid_targets_min": 1080
},
{
"epoch": 2.913793103448276,
"grad_norm": 0.7090008562368073,
"learning_rate": 2.9016936875002377e-05,
"loss": 0.3575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.398629367351532,
"step": 1690,
"valid_targets_mean": 2475.6,
"valid_targets_min": 737
},
{
"epoch": 2.9224137931034484,
"grad_norm": 0.5708369528592575,
"learning_rate": 2.8940110780039385e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2487173229455948,
"step": 1695,
"valid_targets_mean": 2851.6,
"valid_targets_min": 516
},
{
"epoch": 2.9310344827586206,
"grad_norm": 0.8629172656317031,
"learning_rate": 2.8863119471816878e-05,
"loss": 0.3878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45342352986335754,
"step": 1700,
"valid_targets_mean": 2397.3,
"valid_targets_min": 742
},
{
"epoch": 2.939655172413793,
"grad_norm": 0.7017326006705162,
"learning_rate": 2.878596437313434e-05,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3168134093284607,
"step": 1705,
"valid_targets_mean": 2748.8,
"valid_targets_min": 481
},
{
"epoch": 2.9482758620689653,
"grad_norm": 0.9153122090855202,
"learning_rate": 2.87086469098181e-05,
"loss": 0.3652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35482969880104065,
"step": 1710,
"valid_targets_mean": 1666.0,
"valid_targets_min": 398
},
{
"epoch": 2.956896551724138,
"grad_norm": 0.6987207748719971,
"learning_rate": 2.863116851069499e-05,
"loss": 0.3815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36330512166023254,
"step": 1715,
"valid_targets_mean": 2604.6,
"valid_targets_min": 451
},
{
"epoch": 2.9655172413793105,
"grad_norm": 0.8404380696602337,
"learning_rate": 2.855353060756593e-05,
"loss": 0.3345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3547259569168091,
"step": 1720,
"valid_targets_mean": 1856.7,
"valid_targets_min": 611
},
{
"epoch": 2.9741379310344827,
"grad_norm": 0.8361645261499164,
"learning_rate": 2.8475734635179472e-05,
"loss": 0.3766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3678659498691559,
"step": 1725,
"valid_targets_mean": 1938.4,
"valid_targets_min": 643
},
{
"epoch": 2.9827586206896552,
"grad_norm": 0.6342671412128362,
"learning_rate": 2.8397782031205295e-05,
"loss": 0.3333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3068227767944336,
"step": 1730,
"valid_targets_mean": 2862.2,
"valid_targets_min": 424
},
{
"epoch": 2.9913793103448274,
"grad_norm": 0.70350983920623,
"learning_rate": 2.8319674236207634e-05,
"loss": 0.3373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.357696533203125,
"step": 1735,
"valid_targets_mean": 2667.8,
"valid_targets_min": 839
},
{
"epoch": 3.0,
"grad_norm": 0.743166212291011,
"learning_rate": 2.8241412693618638e-05,
"loss": 0.374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29470035433769226,
"step": 1740,
"valid_targets_mean": 2023.8,
"valid_targets_min": 586
},
{
"epoch": 3.0086206896551726,
"grad_norm": 0.6224565306001386,
"learning_rate": 2.816299884971173e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32670581340789795,
"step": 1745,
"valid_targets_mean": 3444.1,
"valid_targets_min": 779
},
{
"epoch": 3.0172413793103448,
"grad_norm": 0.7963369151415589,
"learning_rate": 2.8084434153574847e-05,
"loss": 0.312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2679070830345154,
"step": 1750,
"valid_targets_mean": 2331.9,
"valid_targets_min": 617
},
{
"epoch": 3.0258620689655173,
"grad_norm": 0.8324646205431433,
"learning_rate": 2.8005720057083685e-05,
"loss": 0.319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4266745150089264,
"step": 1755,
"valid_targets_mean": 2636.2,
"valid_targets_min": 468
},
{
"epoch": 3.0344827586206895,
"grad_norm": 0.6413595895033111,
"learning_rate": 2.792685801487486e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29419150948524475,
"step": 1760,
"valid_targets_mean": 3145.2,
"valid_targets_min": 534
},
{
"epoch": 3.043103448275862,
"grad_norm": 0.7783389309831885,
"learning_rate": 2.7847849484319008e-05,
"loss": 0.3171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32182106375694275,
"step": 1765,
"valid_targets_mean": 2271.4,
"valid_targets_min": 409
},
{
"epoch": 3.0517241379310347,
"grad_norm": 0.9049644291439677,
"learning_rate": 2.7768695925493897e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2867991328239441,
"step": 1770,
"valid_targets_mean": 1607.9,
"valid_targets_min": 611
},
{
"epoch": 3.060344827586207,
"grad_norm": 0.6221458496489107,
"learning_rate": 2.7689398801157393e-05,
"loss": 0.3208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41518068313598633,
"step": 1775,
"valid_targets_mean": 4899.2,
"valid_targets_min": 844
},
{
"epoch": 3.0689655172413794,
"grad_norm": 0.7613205444804567,
"learning_rate": 2.7609959576720467e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28315573930740356,
"step": 1780,
"valid_targets_mean": 2667.1,
"valid_targets_min": 829
},
{
"epoch": 3.0775862068965516,
"grad_norm": 0.8143413289449313,
"learning_rate": 2.7530379720220096e-05,
"loss": 0.3087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27521416544914246,
"step": 1785,
"valid_targets_mean": 1862.4,
"valid_targets_min": 534
},
{
"epoch": 3.086206896551724,
"grad_norm": 0.8480450228379316,
"learning_rate": 2.7450660702292132e-05,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25870606303215027,
"step": 1790,
"valid_targets_mean": 1700.4,
"valid_targets_min": 611
},
{
"epoch": 3.0948275862068964,
"grad_norm": 1.238431131240692,
"learning_rate": 2.7370803996144143e-05,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2775198817253113,
"step": 1795,
"valid_targets_mean": 2701.1,
"valid_targets_min": 460
},
{
"epoch": 3.103448275862069,
"grad_norm": 0.8041283864657258,
"learning_rate": 2.7290811077528166e-05,
"loss": 0.3155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3663734793663025,
"step": 1800,
"valid_targets_mean": 2370.8,
"valid_targets_min": 507
},
{
"epoch": 3.1120689655172415,
"grad_norm": 0.8560717116522374,
"learning_rate": 2.7210683424713447e-05,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30424728989601135,
"step": 1805,
"valid_targets_mean": 1917.6,
"valid_targets_min": 612
},
{
"epoch": 3.1206896551724137,
"grad_norm": 0.6705119517885663,
"learning_rate": 2.7130422518459113e-05,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2609316408634186,
"step": 1810,
"valid_targets_mean": 3044.2,
"valid_targets_min": 976
},
{
"epoch": 3.1293103448275863,
"grad_norm": 0.7230075926694457,
"learning_rate": 2.705002984198684e-05,
"loss": 0.2816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.301299512386322,
"step": 1815,
"valid_targets_mean": 2647.1,
"valid_targets_min": 638
},
{
"epoch": 3.1379310344827585,
"grad_norm": 0.8100080109130748,
"learning_rate": 2.6969506880953384e-05,
"loss": 0.3179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31657522916793823,
"step": 1820,
"valid_targets_mean": 2186.7,
"valid_targets_min": 631
},
{
"epoch": 3.146551724137931,
"grad_norm": 0.8423669221223422,
"learning_rate": 2.688885512342318e-05,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2845194637775421,
"step": 1825,
"valid_targets_mean": 2300.3,
"valid_targets_min": 578
},
{
"epoch": 3.1551724137931036,
"grad_norm": 0.6312094922458577,
"learning_rate": 2.680807605984082e-05,
"loss": 0.2745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2565772235393524,
"step": 1830,
"valid_targets_mean": 3699.1,
"valid_targets_min": 866
},
{
"epoch": 3.163793103448276,
"grad_norm": 0.7811266015626148,
"learning_rate": 2.6727171183003502e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3389627933502197,
"step": 1835,
"valid_targets_mean": 2511.2,
"valid_targets_min": 495
},
{
"epoch": 3.1724137931034484,
"grad_norm": 0.8432121831699027,
"learning_rate": 2.6646141988033475e-05,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29517269134521484,
"step": 1840,
"valid_targets_mean": 1874.1,
"valid_targets_min": 661
},
{
"epoch": 3.1810344827586206,
"grad_norm": 1.0990805510619235,
"learning_rate": 2.6564989972350364e-05,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2816365957260132,
"step": 1845,
"valid_targets_mean": 3813.9,
"valid_targets_min": 846
},
{
"epoch": 3.189655172413793,
"grad_norm": 0.8279965744680023,
"learning_rate": 2.6483716635643535e-05,
"loss": 0.3212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2970189154148102,
"step": 1850,
"valid_targets_mean": 2104.2,
"valid_targets_min": 798
},
{
"epoch": 3.1982758620689653,
"grad_norm": 0.8196847761009315,
"learning_rate": 2.6402323479844364e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3160390257835388,
"step": 1855,
"valid_targets_mean": 2641.1,
"valid_targets_min": 937
},
{
"epoch": 3.206896551724138,
"grad_norm": 1.6772060307830066,
"learning_rate": 2.6320812009098472e-05,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2730563282966614,
"step": 1860,
"valid_targets_mean": 2182.1,
"valid_targets_min": 424
},
{
"epoch": 3.2155172413793105,
"grad_norm": 0.6982604978424688,
"learning_rate": 2.6239183729737957e-05,
"loss": 0.37,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2999745309352875,
"step": 1865,
"valid_targets_mean": 2517.1,
"valid_targets_min": 796
},
{
"epoch": 3.2241379310344827,
"grad_norm": 0.9495735105999557,
"learning_rate": 2.6157440150253535e-05,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32909655570983887,
"step": 1870,
"valid_targets_mean": 2221.7,
"valid_targets_min": 805
},
{
"epoch": 3.2327586206896552,
"grad_norm": 0.7046523962164161,
"learning_rate": 2.6075582781266665e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26159366965293884,
"step": 1875,
"valid_targets_mean": 2636.9,
"valid_targets_min": 601
},
{
"epoch": 3.2413793103448274,
"grad_norm": 0.742401594365087,
"learning_rate": 2.5993613135501643e-05,
"loss": 0.2981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2503337562084198,
"step": 1880,
"valid_targets_mean": 2461.8,
"valid_targets_min": 895
},
{
"epoch": 3.25,
"grad_norm": 0.81344784045908,
"learning_rate": 2.5911532727757625e-05,
"loss": 0.3171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37119442224502563,
"step": 1885,
"valid_targets_mean": 2262.6,
"valid_targets_min": 654
},
{
"epoch": 3.2586206896551726,
"grad_norm": 0.8599496940029792,
"learning_rate": 2.582934307488067e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28416091203689575,
"step": 1890,
"valid_targets_mean": 1887.2,
"valid_targets_min": 528
},
{
"epoch": 3.2672413793103448,
"grad_norm": 0.9973091039588626,
"learning_rate": 2.5747045695735674e-05,
"loss": 0.2713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35767045617103577,
"step": 1895,
"valid_targets_mean": 1535.4,
"valid_targets_min": 786
},
{
"epoch": 3.2758620689655173,
"grad_norm": 0.6183796807165394,
"learning_rate": 2.5664642111178312e-05,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26878735423088074,
"step": 1900,
"valid_targets_mean": 3769.8,
"valid_targets_min": 907
},
{
"epoch": 3.2844827586206895,
"grad_norm": 0.5757846667776677,
"learning_rate": 2.5582133844026943e-05,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2681350111961365,
"step": 1905,
"valid_targets_mean": 4193.9,
"valid_targets_min": 712
},
{
"epoch": 3.293103448275862,
"grad_norm": 0.7275958613903811,
"learning_rate": 2.5499522419034462e-05,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21775801479816437,
"step": 1910,
"valid_targets_mean": 2068.1,
"valid_targets_min": 685
},
{
"epoch": 3.3017241379310347,
"grad_norm": 0.648898359722817,
"learning_rate": 2.5416809362860107e-05,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34529179334640503,
"step": 1915,
"valid_targets_mean": 3094.9,
"valid_targets_min": 1146
},
{
"epoch": 3.310344827586207,
"grad_norm": 0.62511185430479,
"learning_rate": 2.5333996204041276e-05,
"loss": 0.3104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27681249380111694,
"step": 1920,
"valid_targets_mean": 3492.2,
"valid_targets_min": 737
},
{
"epoch": 3.3189655172413794,
"grad_norm": 0.6618453164474787,
"learning_rate": 2.5251084472965257e-05,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23826207220554352,
"step": 1925,
"valid_targets_mean": 2778.3,
"valid_targets_min": 498
},
{
"epoch": 3.3275862068965516,
"grad_norm": 0.8038892215545382,
"learning_rate": 2.5168075701840948e-05,
"loss": 0.2821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.291714072227478,
"step": 1930,
"valid_targets_mean": 2213.9,
"valid_targets_min": 543
},
{
"epoch": 3.336206896551724,
"grad_norm": 0.5772711681646889,
"learning_rate": 2.5084971424670568e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17962776124477386,
"step": 1935,
"valid_targets_mean": 2994.7,
"valid_targets_min": 412
},
{
"epoch": 3.344827586206897,
"grad_norm": 0.7120332340970782,
"learning_rate": 2.500177317722126e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2869756817817688,
"step": 1940,
"valid_targets_mean": 2739.6,
"valid_targets_min": 606
},
{
"epoch": 3.353448275862069,
"grad_norm": 0.7800922350042635,
"learning_rate": 2.4918482496996757e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2766876816749573,
"step": 1945,
"valid_targets_mean": 2119.1,
"valid_targets_min": 654
},
{
"epoch": 3.3620689655172415,
"grad_norm": 0.8737595126801067,
"learning_rate": 2.483510092320895e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3302645981311798,
"step": 1950,
"valid_targets_mean": 1949.8,
"valid_targets_min": 399
},
{
"epoch": 3.3706896551724137,
"grad_norm": 0.648990693564747,
"learning_rate": 2.4751629996749427e-05,
"loss": 0.3201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28055495023727417,
"step": 1955,
"valid_targets_mean": 3328.7,
"valid_targets_min": 523
},
{
"epoch": 3.3793103448275863,
"grad_norm": 0.891540323940474,
"learning_rate": 2.4668071260161022e-05,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3185821771621704,
"step": 1960,
"valid_targets_mean": 2461.1,
"valid_targets_min": 784
},
{
"epoch": 3.3879310344827585,
"grad_norm": 0.6917295377931933,
"learning_rate": 2.4584426257609315e-05,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.218665212392807,
"step": 1965,
"valid_targets_mean": 2213.4,
"valid_targets_min": 756
},
{
"epoch": 3.396551724137931,
"grad_norm": 1.010592244634894,
"learning_rate": 2.4500696534854062e-05,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37055134773254395,
"step": 1970,
"valid_targets_mean": 1879.9,
"valid_targets_min": 583
},
{
"epoch": 3.405172413793103,
"grad_norm": 0.9519123896373668,
"learning_rate": 2.4416883639220647e-05,
"loss": 0.3325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33236557245254517,
"step": 1975,
"valid_targets_mean": 2066.6,
"valid_targets_min": 584
},
{
"epoch": 3.413793103448276,
"grad_norm": 0.7323235119643152,
"learning_rate": 2.4332989119571506e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2706213891506195,
"step": 1980,
"valid_targets_mean": 2358.1,
"valid_targets_min": 712
},
{
"epoch": 3.4224137931034484,
"grad_norm": 0.8154170625298807,
"learning_rate": 2.4249014526277473e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3261958658695221,
"step": 1985,
"valid_targets_mean": 2225.0,
"valid_targets_min": 694
},
{
"epoch": 3.4310344827586206,
"grad_norm": 0.7583929734614248,
"learning_rate": 2.416496141118915e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3404994606971741,
"step": 1990,
"valid_targets_mean": 2448.5,
"valid_targets_min": 455
},
{
"epoch": 3.439655172413793,
"grad_norm": 0.76486119481783,
"learning_rate": 2.4080831327608224e-05,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3539115786552429,
"step": 1995,
"valid_targets_mean": 2719.1,
"valid_targets_min": 717
},
{
"epoch": 3.4482758620689653,
"grad_norm": 0.5769571311421944,
"learning_rate": 2.3996625830258742e-05,
"loss": 0.3165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36898016929626465,
"step": 2000,
"valid_targets_mean": 4286.1,
"valid_targets_min": 725
},
{
"epoch": 3.456896551724138,
"grad_norm": 0.5832684017230357,
"learning_rate": 2.3912346475258424e-05,
"loss": 0.2961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20343273878097534,
"step": 2005,
"valid_targets_mean": 3749.2,
"valid_targets_min": 953
},
{
"epoch": 3.4655172413793105,
"grad_norm": 0.7460121503250889,
"learning_rate": 2.3827994820089856e-05,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3511773943901062,
"step": 2010,
"valid_targets_mean": 2519.6,
"valid_targets_min": 685
},
{
"epoch": 3.4741379310344827,
"grad_norm": 0.8667582413887146,
"learning_rate": 2.3743572423571752e-05,
"loss": 0.2986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2761188745498657,
"step": 2015,
"valid_targets_mean": 1743.6,
"valid_targets_min": 457
},
{
"epoch": 3.4827586206896552,
"grad_norm": 0.8443538913181367,
"learning_rate": 2.365908084583011e-05,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3406338095664978,
"step": 2020,
"valid_targets_mean": 2261.7,
"valid_targets_min": 710
},
{
"epoch": 3.4913793103448274,
"grad_norm": 0.8474513541413226,
"learning_rate": 2.3574521648269406e-05,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2867903709411621,
"step": 2025,
"valid_targets_mean": 1912.2,
"valid_targets_min": 607
},
{
"epoch": 3.5,
"grad_norm": 0.7006881241253591,
"learning_rate": 2.3489896393543717e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2570182681083679,
"step": 2030,
"valid_targets_mean": 2751.8,
"valid_targets_min": 871
},
{
"epoch": 3.5086206896551726,
"grad_norm": 0.7552809275843348,
"learning_rate": 2.340520664552788e-05,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30410170555114746,
"step": 2035,
"valid_targets_mean": 2564.1,
"valid_targets_min": 549
},
{
"epoch": 3.5172413793103448,
"grad_norm": 0.8825867836498272,
"learning_rate": 2.3320453969288553e-05,
"loss": 0.3381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3782389760017395,
"step": 2040,
"valid_targets_mean": 1920.1,
"valid_targets_min": 645
},
{
"epoch": 3.5258620689655173,
"grad_norm": 0.7921272597229708,
"learning_rate": 2.32356399310553e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2745018005371094,
"step": 2045,
"valid_targets_mean": 2553.4,
"valid_targets_min": 765
},
{
"epoch": 3.5344827586206895,
"grad_norm": 0.7063871315382729,
"learning_rate": 2.3150766098191667e-05,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25150594115257263,
"step": 2050,
"valid_targets_mean": 2500.0,
"valid_targets_min": 427
},
{
"epoch": 3.543103448275862,
"grad_norm": 0.780288892052238,
"learning_rate": 2.3065834039166212e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3334049582481384,
"step": 2055,
"valid_targets_mean": 2465.0,
"valid_targets_min": 569
},
{
"epoch": 3.5517241379310347,
"grad_norm": 0.7034316364336279,
"learning_rate": 2.2980845323523487e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2297370731830597,
"step": 2060,
"valid_targets_mean": 2638.2,
"valid_targets_min": 596
},
{
"epoch": 3.560344827586207,
"grad_norm": 0.6064369322023231,
"learning_rate": 2.2895801521855096e-05,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2786329984664917,
"step": 2065,
"valid_targets_mean": 4094.6,
"valid_targets_min": 1018
},
{
"epoch": 3.5689655172413794,
"grad_norm": 0.653788622283706,
"learning_rate": 2.2810704205770587e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2808879315853119,
"step": 2070,
"valid_targets_mean": 3194.4,
"valid_targets_min": 734
},
{
"epoch": 3.5775862068965516,
"grad_norm": 0.8521494971580398,
"learning_rate": 2.2725554947868495e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24698427319526672,
"step": 2075,
"valid_targets_mean": 1753.4,
"valid_targets_min": 661
},
{
"epoch": 3.586206896551724,
"grad_norm": 0.8795497261182633,
"learning_rate": 2.2640355321707218e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2842119634151459,
"step": 2080,
"valid_targets_mean": 2270.3,
"valid_targets_min": 636
},
{
"epoch": 3.594827586206897,
"grad_norm": 0.7839865726117404,
"learning_rate": 2.2555106901775955e-05,
"loss": 0.3753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2968730032444,
"step": 2085,
"valid_targets_mean": 1988.5,
"valid_targets_min": 593
},
{
"epoch": 3.603448275862069,
"grad_norm": 0.787606769892728,
"learning_rate": 2.246981126346564e-05,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44315293431282043,
"step": 2090,
"valid_targets_mean": 3020.5,
"valid_targets_min": 926
},
{
"epoch": 3.612068965517241,
"grad_norm": 0.610584461944452,
"learning_rate": 2.238446998303977e-05,
"loss": 0.3238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3059382438659668,
"step": 2095,
"valid_targets_mean": 3842.9,
"valid_targets_min": 543
},
{
"epoch": 3.6206896551724137,
"grad_norm": 0.7828264148089181,
"learning_rate": 2.2299084637605343e-05,
"loss": 0.2631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29074084758758545,
"step": 2100,
"valid_targets_mean": 2296.9,
"valid_targets_min": 937
},
{
"epoch": 3.6293103448275863,
"grad_norm": 0.8127024938088724,
"learning_rate": 2.221365680508364e-05,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2938804030418396,
"step": 2105,
"valid_targets_mean": 2357.0,
"valid_targets_min": 753
},
{
"epoch": 3.637931034482759,
"grad_norm": 0.7160590569798018,
"learning_rate": 2.2128188064181143e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24818356335163116,
"step": 2110,
"valid_targets_mean": 2373.7,
"valid_targets_min": 574
},
{
"epoch": 3.646551724137931,
"grad_norm": 0.8368002017730753,
"learning_rate": 2.2042679994360296e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32543590664863586,
"step": 2115,
"valid_targets_mean": 1967.9,
"valid_targets_min": 556
},
{
"epoch": 3.655172413793103,
"grad_norm": 0.6869621086443359,
"learning_rate": 2.195713417581033e-05,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35331353545188904,
"step": 2120,
"valid_targets_mean": 3145.4,
"valid_targets_min": 547
},
{
"epoch": 3.663793103448276,
"grad_norm": 1.7802277556554986,
"learning_rate": 2.1871552189418113e-05,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28531312942504883,
"step": 2125,
"valid_targets_mean": 2089.6,
"valid_targets_min": 442
},
{
"epoch": 3.6724137931034484,
"grad_norm": 0.7617925208270429,
"learning_rate": 2.1785935616738855e-05,
"loss": 0.3911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25667494535446167,
"step": 2130,
"valid_targets_mean": 2242.4,
"valid_targets_min": 807
},
{
"epoch": 3.6810344827586206,
"grad_norm": 0.8992850081501342,
"learning_rate": 2.170028603996695e-05,
"loss": 0.3385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28584620356559753,
"step": 2135,
"valid_targets_mean": 1704.6,
"valid_targets_min": 721
},
{
"epoch": 3.689655172413793,
"grad_norm": 0.7823582786020942,
"learning_rate": 2.161460504190668e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34780627489089966,
"step": 2140,
"valid_targets_mean": 2750.6,
"valid_targets_min": 610
},
{
"epoch": 3.6982758620689653,
"grad_norm": 0.8195994514460628,
"learning_rate": 2.1528894205943017e-05,
"loss": 0.3372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3839362859725952,
"step": 2145,
"valid_targets_mean": 2548.4,
"valid_targets_min": 512
},
{
"epoch": 3.706896551724138,
"grad_norm": 0.8494572477645436,
"learning_rate": 2.1443155116012328e-05,
"loss": 0.3117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4128968417644501,
"step": 2150,
"valid_targets_mean": 2398.0,
"valid_targets_min": 597
},
{
"epoch": 3.7155172413793105,
"grad_norm": 0.8997195991583952,
"learning_rate": 2.1357389356573098e-05,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27611222863197327,
"step": 2155,
"valid_targets_mean": 1524.3,
"valid_targets_min": 352
},
{
"epoch": 3.7241379310344827,
"grad_norm": 0.7164419636717259,
"learning_rate": 2.1271598512576705e-05,
"loss": 0.3153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35011881589889526,
"step": 2160,
"valid_targets_mean": 2900.4,
"valid_targets_min": 568
},
{
"epoch": 3.7327586206896552,
"grad_norm": 0.8480166956097996,
"learning_rate": 2.1185784169438047e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34647125005722046,
"step": 2165,
"valid_targets_mean": 2132.8,
"valid_targets_min": 733
},
{
"epoch": 3.7413793103448274,
"grad_norm": 0.6292335934505978,
"learning_rate": 2.1099947913006303e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30451124906539917,
"step": 2170,
"valid_targets_mean": 3287.4,
"valid_targets_min": 511
},
{
"epoch": 3.75,
"grad_norm": 0.5754753939117979,
"learning_rate": 2.1014091329535618e-05,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.302144855260849,
"step": 2175,
"valid_targets_mean": 4022.0,
"valid_targets_min": 586
},
{
"epoch": 3.7586206896551726,
"grad_norm": 0.7017710687987908,
"learning_rate": 2.0928216005655762e-05,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2097795307636261,
"step": 2180,
"valid_targets_mean": 2899.4,
"valid_targets_min": 478
},
{
"epoch": 3.7672413793103448,
"grad_norm": 0.9187704585481599,
"learning_rate": 2.084232352834285e-05,
"loss": 0.3292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31041762232780457,
"step": 2185,
"valid_targets_mean": 2338.7,
"valid_targets_min": 744
},
{
"epoch": 3.7758620689655173,
"grad_norm": 0.7170011346350758,
"learning_rate": 2.0756415484889975e-05,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23631168901920319,
"step": 2190,
"valid_targets_mean": 2144.9,
"valid_targets_min": 661
},
{
"epoch": 3.7844827586206895,
"grad_norm": 0.8606344295508895,
"learning_rate": 2.0670493462877897e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32752877473831177,
"step": 2195,
"valid_targets_mean": 1855.7,
"valid_targets_min": 430
},
{
"epoch": 3.793103448275862,
"grad_norm": 0.7682771055577163,
"learning_rate": 2.0584559050145706e-05,
"loss": 0.329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48432260751724243,
"step": 2200,
"valid_targets_mean": 3133.6,
"valid_targets_min": 561
},
{
"epoch": 3.8017241379310347,
"grad_norm": 0.8349304825117818,
"learning_rate": 2.0498613834761462e-05,
"loss": 0.3085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3010793924331665,
"step": 2205,
"valid_targets_mean": 2094.9,
"valid_targets_min": 634
},
{
"epoch": 3.810344827586207,
"grad_norm": 0.670157550483695,
"learning_rate": 2.0412659404992862e-05,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2826797068119049,
"step": 2210,
"valid_targets_mean": 3276.9,
"valid_targets_min": 479
},
{
"epoch": 3.8189655172413794,
"grad_norm": 0.733561876185473,
"learning_rate": 2.0326697349277893e-05,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30336707830429077,
"step": 2215,
"valid_targets_mean": 2686.1,
"valid_targets_min": 772
},
{
"epoch": 3.8275862068965516,
"grad_norm": 0.7049773389785631,
"learning_rate": 2.024072925619546e-05,
"loss": 0.3069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26717764139175415,
"step": 2220,
"valid_targets_mean": 3601.4,
"valid_targets_min": 738
},
{
"epoch": 3.836206896551724,
"grad_norm": 0.8019247619108416,
"learning_rate": 2.0154756714436043e-05,
"loss": 0.3114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3339763283729553,
"step": 2225,
"valid_targets_mean": 2529.2,
"valid_targets_min": 567
},
{
"epoch": 3.844827586206897,
"grad_norm": 0.8139666943159004,
"learning_rate": 2.006878131277233e-05,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2815071940422058,
"step": 2230,
"valid_targets_mean": 2022.9,
"valid_targets_min": 523
},
{
"epoch": 3.853448275862069,
"grad_norm": 0.713112858060529,
"learning_rate": 1.9982804640029864e-05,
"loss": 0.3146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3495800197124481,
"step": 2235,
"valid_targets_mean": 2557.1,
"valid_targets_min": 522
},
{
"epoch": 3.862068965517241,
"grad_norm": 0.9058457107189625,
"learning_rate": 1.989682828505767e-05,
"loss": 0.3303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3590564727783203,
"step": 2240,
"valid_targets_mean": 1953.3,
"valid_targets_min": 389
},
{
"epoch": 3.8706896551724137,
"grad_norm": 0.7293645847517138,
"learning_rate": 1.9810853836698913e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24753639101982117,
"step": 2245,
"valid_targets_mean": 2149.6,
"valid_targets_min": 619
},
{
"epoch": 3.8793103448275863,
"grad_norm": 0.7031641747976873,
"learning_rate": 1.972488288376151e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2974679470062256,
"step": 2250,
"valid_targets_mean": 2780.9,
"valid_targets_min": 470
},
{
"epoch": 3.887931034482759,
"grad_norm": 0.8885166742958897,
"learning_rate": 1.963891701498879e-05,
"loss": 0.312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31055015325546265,
"step": 2255,
"valid_targets_mean": 1596.9,
"valid_targets_min": 642
},
{
"epoch": 3.896551724137931,
"grad_norm": 0.7261435079831179,
"learning_rate": 1.955295781903014e-05,
"loss": 0.3228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24428752064704895,
"step": 2260,
"valid_targets_mean": 2453.4,
"valid_targets_min": 674
},
{
"epoch": 3.905172413793103,
"grad_norm": 0.8246463215353056,
"learning_rate": 1.9467006884411605e-05,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3109739422798157,
"step": 2265,
"valid_targets_mean": 2420.3,
"valid_targets_min": 748
},
{
"epoch": 3.913793103448276,
"grad_norm": 0.6601682761330331,
"learning_rate": 1.9381065799506583e-05,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2506582736968994,
"step": 2270,
"valid_targets_mean": 3001.2,
"valid_targets_min": 787
},
{
"epoch": 3.9224137931034484,
"grad_norm": 0.6334105777237168,
"learning_rate": 1.929513615250643e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3046247363090515,
"step": 2275,
"valid_targets_mean": 3295.7,
"valid_targets_min": 979
},
{
"epoch": 3.9310344827586206,
"grad_norm": 0.6634253062353758,
"learning_rate": 1.9209219531391155e-05,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28064969182014465,
"step": 2280,
"valid_targets_mean": 3317.7,
"valid_targets_min": 510
},
{
"epoch": 3.939655172413793,
"grad_norm": 0.8241315570534355,
"learning_rate": 1.9123317523900015e-05,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3636839687824249,
"step": 2285,
"valid_targets_mean": 2278.6,
"valid_targets_min": 765
},
{
"epoch": 3.9482758620689653,
"grad_norm": 0.5973298614024068,
"learning_rate": 1.9037431717502253e-05,
"loss": 0.3214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3552555441856384,
"step": 2290,
"valid_targets_mean": 4570.8,
"valid_targets_min": 545
},
{
"epoch": 3.956896551724138,
"grad_norm": 0.7125951830374488,
"learning_rate": 1.8951563699367673e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2534135580062866,
"step": 2295,
"valid_targets_mean": 2782.2,
"valid_targets_min": 644
},
{
"epoch": 3.9655172413793105,
"grad_norm": 0.7013488738121144,
"learning_rate": 1.886571505633737e-05,
"loss": 0.3055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3117072284221649,
"step": 2300,
"valid_targets_mean": 2736.2,
"valid_targets_min": 791
},
{
"epoch": 3.9741379310344827,
"grad_norm": 0.7932404713933431,
"learning_rate": 1.8779887374894384e-05,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.304098516702652,
"step": 2305,
"valid_targets_mean": 2292.9,
"valid_targets_min": 773
},
{
"epoch": 3.9827586206896552,
"grad_norm": 0.7615525880276409,
"learning_rate": 1.8694082241134385e-05,
"loss": 0.3484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3014771342277527,
"step": 2310,
"valid_targets_mean": 2608.2,
"valid_targets_min": 822
},
{
"epoch": 3.9913793103448274,
"grad_norm": 0.7054702340895173,
"learning_rate": 1.8608301240736378e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3216426968574524,
"step": 2315,
"valid_targets_mean": 2888.3,
"valid_targets_min": 519
},
{
"epoch": 4.0,
"grad_norm": 0.8671769739177089,
"learning_rate": 1.852254595893335e-05,
"loss": 0.3191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3277759850025177,
"step": 2320,
"valid_targets_mean": 2034.9,
"valid_targets_min": 679
},
{
"epoch": 4.008620689655173,
"grad_norm": 0.8662049706352303,
"learning_rate": 1.8436817980483035e-05,
"loss": 0.2731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23021268844604492,
"step": 2325,
"valid_targets_mean": 1730.6,
"valid_targets_min": 547
},
{
"epoch": 4.017241379310345,
"grad_norm": 0.7888888970206421,
"learning_rate": 1.835111888963859e-05,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3193662464618683,
"step": 2330,
"valid_targets_mean": 2617.9,
"valid_targets_min": 807
},
{
"epoch": 4.025862068965517,
"grad_norm": 0.8050736339071413,
"learning_rate": 1.8265450270119335e-05,
"loss": 0.2168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23052524030208588,
"step": 2335,
"valid_targets_mean": 2918.8,
"valid_targets_min": 545
},
{
"epoch": 4.0344827586206895,
"grad_norm": 0.8104059449972785,
"learning_rate": 1.8179813705081468e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25504401326179504,
"step": 2340,
"valid_targets_mean": 2983.4,
"valid_targets_min": 519
},
{
"epoch": 4.043103448275862,
"grad_norm": 0.7353605793149197,
"learning_rate": 1.8094210777088833e-05,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.252414733171463,
"step": 2345,
"valid_targets_mean": 2531.2,
"valid_targets_min": 622
},
{
"epoch": 4.051724137931035,
"grad_norm": 0.6092689710576782,
"learning_rate": 1.800864306808367e-05,
"loss": 0.2341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20068293809890747,
"step": 2350,
"valid_targets_mean": 3792.4,
"valid_targets_min": 651
},
{
"epoch": 4.060344827586207,
"grad_norm": 0.858412056979054,
"learning_rate": 1.7923112159357344e-05,
"loss": 0.2411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28051990270614624,
"step": 2355,
"valid_targets_mean": 2174.3,
"valid_targets_min": 875
},
{
"epoch": 4.068965517241379,
"grad_norm": 0.8572346124316681,
"learning_rate": 1.783761963152117e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31026482582092285,
"step": 2360,
"valid_targets_mean": 2267.0,
"valid_targets_min": 827
},
{
"epoch": 4.077586206896552,
"grad_norm": 0.9678784332310315,
"learning_rate": 1.7752167064477173e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29770296812057495,
"step": 2365,
"valid_targets_mean": 1884.4,
"valid_targets_min": 583
},
{
"epoch": 4.086206896551724,
"grad_norm": 0.7779777387424832,
"learning_rate": 1.7666756037388923e-05,
"loss": 0.2739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32733461260795593,
"step": 2370,
"valid_targets_mean": 2521.4,
"valid_targets_min": 485
},
{
"epoch": 4.094827586206897,
"grad_norm": 0.9267768621801464,
"learning_rate": 1.7581388128652315e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2627328038215637,
"step": 2375,
"valid_targets_mean": 2000.8,
"valid_targets_min": 679
},
{
"epoch": 4.103448275862069,
"grad_norm": 0.9298458568007258,
"learning_rate": 1.7496064915866414e-05,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2559812068939209,
"step": 2380,
"valid_targets_mean": 1880.1,
"valid_targets_min": 873
},
{
"epoch": 4.112068965517241,
"grad_norm": 0.7420079443094495,
"learning_rate": 1.7410787975804314e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20432040095329285,
"step": 2385,
"valid_targets_mean": 2497.0,
"valid_targets_min": 1002
},
{
"epoch": 4.120689655172414,
"grad_norm": 0.9139413054677984,
"learning_rate": 1.732555888438398e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2299332469701767,
"step": 2390,
"valid_targets_mean": 1902.1,
"valid_targets_min": 472
},
{
"epoch": 4.129310344827586,
"grad_norm": 0.9093389443991601,
"learning_rate": 1.7240379216639136e-05,
"loss": 0.3059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2951817512512207,
"step": 2395,
"valid_targets_mean": 2019.4,
"valid_targets_min": 584
},
{
"epoch": 4.137931034482759,
"grad_norm": 0.7632400394885388,
"learning_rate": 1.7155250546690173e-05,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2085626870393753,
"step": 2400,
"valid_targets_mean": 2969.6,
"valid_targets_min": 641
},
{
"epoch": 4.146551724137931,
"grad_norm": 0.8260537770861034,
"learning_rate": 1.707017444771502e-05,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2482033669948578,
"step": 2405,
"valid_targets_mean": 2091.2,
"valid_targets_min": 820
},
{
"epoch": 4.155172413793103,
"grad_norm": 0.6923161253459018,
"learning_rate": 1.6985152491920103e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20103991031646729,
"step": 2410,
"valid_targets_mean": 2961.4,
"valid_targets_min": 572
},
{
"epoch": 4.163793103448276,
"grad_norm": 0.723678400646684,
"learning_rate": 1.690018625051128e-05,
"loss": 0.2365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2579345107078552,
"step": 2415,
"valid_targets_mean": 2701.3,
"valid_targets_min": 935
},
{
"epoch": 4.172413793103448,
"grad_norm": 0.7494143777775046,
"learning_rate": 1.681527729366481e-05,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2361277937889099,
"step": 2420,
"valid_targets_mean": 2569.4,
"valid_targets_min": 462
},
{
"epoch": 4.181034482758621,
"grad_norm": 0.9112887953263451,
"learning_rate": 1.673042719049834e-05,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2863658666610718,
"step": 2425,
"valid_targets_mean": 2074.4,
"valid_targets_min": 615
},
{
"epoch": 4.189655172413793,
"grad_norm": 0.7937887670056066,
"learning_rate": 1.664563750904188e-05,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2154037058353424,
"step": 2430,
"valid_targets_mean": 2729.9,
"valid_targets_min": 743
},
{
"epoch": 4.198275862068965,
"grad_norm": 0.7433928051105411,
"learning_rate": 1.656090981620888e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24456550180912018,
"step": 2435,
"valid_targets_mean": 2620.4,
"valid_targets_min": 599
},
{
"epoch": 4.206896551724138,
"grad_norm": 1.045004846134096,
"learning_rate": 1.64762456777672e-05,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2445065975189209,
"step": 2440,
"valid_targets_mean": 1532.7,
"valid_targets_min": 539
},
{
"epoch": 4.2155172413793105,
"grad_norm": 0.8682943506947929,
"learning_rate": 1.6391646658310242e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2688167989253998,
"step": 2445,
"valid_targets_mean": 2110.8,
"valid_targets_min": 536
},
{
"epoch": 4.224137931034483,
"grad_norm": 0.7496628558965965,
"learning_rate": 1.6307114321227996e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.280312180519104,
"step": 2450,
"valid_targets_mean": 2859.6,
"valid_targets_min": 1013
},
{
"epoch": 4.232758620689655,
"grad_norm": 0.8178573339580305,
"learning_rate": 1.622265022867818e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3833100199699402,
"step": 2455,
"valid_targets_mean": 2496.7,
"valid_targets_min": 710
},
{
"epoch": 4.241379310344827,
"grad_norm": 0.8958331031395433,
"learning_rate": 1.6138255941557336e-05,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23110151290893555,
"step": 2460,
"valid_targets_mean": 2041.5,
"valid_targets_min": 690
},
{
"epoch": 4.25,
"grad_norm": 1.2008802918634554,
"learning_rate": 1.6053933019472003e-05,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23847255110740662,
"step": 2465,
"valid_targets_mean": 2182.4,
"valid_targets_min": 738
},
{
"epoch": 4.258620689655173,
"grad_norm": 0.7253739780355688,
"learning_rate": 1.5969683020709902e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19945028424263,
"step": 2470,
"valid_targets_mean": 3067.0,
"valid_targets_min": 907
},
{
"epoch": 4.267241379310345,
"grad_norm": 0.7944155046031013,
"learning_rate": 1.5885507502211108e-05,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24398934841156006,
"step": 2475,
"valid_targets_mean": 2691.2,
"valid_targets_min": 600
},
{
"epoch": 4.275862068965517,
"grad_norm": 0.7602735777735121,
"learning_rate": 1.5801408019539345e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26826539635658264,
"step": 2480,
"valid_targets_mean": 2809.9,
"valid_targets_min": 736
},
{
"epoch": 4.2844827586206895,
"grad_norm": 0.8482564423959594,
"learning_rate": 1.5717386126853156e-05,
"loss": 0.2334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2374395728111267,
"step": 2485,
"valid_targets_mean": 2188.2,
"valid_targets_min": 553
},
{
"epoch": 4.293103448275862,
"grad_norm": 0.885080946312999,
"learning_rate": 1.5633443376877236e-05,
"loss": 0.2797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21632343530654907,
"step": 2490,
"valid_targets_mean": 1872.2,
"valid_targets_min": 683
},
{
"epoch": 4.301724137931035,
"grad_norm": 0.7270077139583213,
"learning_rate": 1.5549581320873715e-05,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23827451467514038,
"step": 2495,
"valid_targets_mean": 2864.6,
"valid_targets_min": 560
},
{
"epoch": 4.310344827586207,
"grad_norm": 0.884280348292525,
"learning_rate": 1.546580150861351e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2653864026069641,
"step": 2500,
"valid_targets_mean": 2208.6,
"valid_targets_min": 616
},
{
"epoch": 4.318965517241379,
"grad_norm": 0.7511935061914762,
"learning_rate": 1.5382105488347654e-05,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2234722077846527,
"step": 2505,
"valid_targets_mean": 2560.5,
"valid_targets_min": 907
},
{
"epoch": 4.327586206896552,
"grad_norm": 0.6927902145845654,
"learning_rate": 1.5298494806778733e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3259279429912567,
"step": 2510,
"valid_targets_mean": 3623.5,
"valid_targets_min": 424
},
{
"epoch": 4.336206896551724,
"grad_norm": 0.9363964007863711,
"learning_rate": 1.5214971009032251e-05,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27032387256622314,
"step": 2515,
"valid_targets_mean": 2325.2,
"valid_targets_min": 674
},
{
"epoch": 4.344827586206897,
"grad_norm": 0.6946434774843553,
"learning_rate": 1.51315356386281e-05,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19004008173942566,
"step": 2520,
"valid_targets_mean": 2366.9,
"valid_targets_min": 578
},
{
"epoch": 4.353448275862069,
"grad_norm": 0.8539126756883658,
"learning_rate": 1.5048190237452052e-05,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2525019645690918,
"step": 2525,
"valid_targets_mean": 2396.6,
"valid_targets_min": 516
},
{
"epoch": 4.362068965517241,
"grad_norm": 0.79778758981723,
"learning_rate": 1.4964936345727217e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2425791621208191,
"step": 2530,
"valid_targets_mean": 2591.4,
"valid_targets_min": 463
},
{
"epoch": 4.370689655172414,
"grad_norm": 0.9069366963385622,
"learning_rate": 1.4881775501985645e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2515653371810913,
"step": 2535,
"valid_targets_mean": 2669.3,
"valid_targets_min": 409
},
{
"epoch": 4.379310344827586,
"grad_norm": 0.7963250270457406,
"learning_rate": 1.4798709243039842e-05,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21995809674263,
"step": 2540,
"valid_targets_mean": 2314.8,
"valid_targets_min": 839
},
{
"epoch": 4.387931034482759,
"grad_norm": 0.9179745890697341,
"learning_rate": 1.4715739103954375e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25221094489097595,
"step": 2545,
"valid_targets_mean": 2191.8,
"valid_targets_min": 933
},
{
"epoch": 4.396551724137931,
"grad_norm": 0.6622828676925838,
"learning_rate": 1.4632866618017543e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25719982385635376,
"step": 2550,
"valid_targets_mean": 3660.8,
"valid_targets_min": 1160
},
{
"epoch": 4.405172413793103,
"grad_norm": 0.8591681509143264,
"learning_rate": 1.4550093316712987e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24447187781333923,
"step": 2555,
"valid_targets_mean": 2159.6,
"valid_targets_min": 721
},
{
"epoch": 4.413793103448276,
"grad_norm": 0.7666460077302556,
"learning_rate": 1.4467420729691433e-05,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23079776763916016,
"step": 2560,
"valid_targets_mean": 2426.2,
"valid_targets_min": 429
},
{
"epoch": 4.422413793103448,
"grad_norm": 0.8628984095026991,
"learning_rate": 1.4384850384742412e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20822520554065704,
"step": 2565,
"valid_targets_mean": 2130.8,
"valid_targets_min": 783
},
{
"epoch": 4.431034482758621,
"grad_norm": 0.6655183257870557,
"learning_rate": 1.4302383807766003e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23718425631523132,
"step": 2570,
"valid_targets_mean": 3646.4,
"valid_targets_min": 893
},
{
"epoch": 4.439655172413793,
"grad_norm": 0.9842333882472362,
"learning_rate": 1.4220022522744667e-05,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2799840569496155,
"step": 2575,
"valid_targets_mean": 1720.6,
"valid_targets_min": 474
},
{
"epoch": 4.448275862068965,
"grad_norm": 0.826442375777945,
"learning_rate": 1.4137768051715059e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25755539536476135,
"step": 2580,
"valid_targets_mean": 2250.4,
"valid_targets_min": 964
},
{
"epoch": 4.456896551724138,
"grad_norm": 0.8335441437915141,
"learning_rate": 1.4055621914739915e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2718716859817505,
"step": 2585,
"valid_targets_mean": 2529.5,
"valid_targets_min": 950
},
{
"epoch": 4.4655172413793105,
"grad_norm": 0.5992395028797994,
"learning_rate": 1.3973585629879973e-05,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20316217839717865,
"step": 2590,
"valid_targets_mean": 4162.9,
"valid_targets_min": 561
},
{
"epoch": 4.474137931034483,
"grad_norm": 0.5884128756243574,
"learning_rate": 1.3891660713165873e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20528560876846313,
"step": 2595,
"valid_targets_mean": 3888.8,
"valid_targets_min": 1177
},
{
"epoch": 4.482758620689655,
"grad_norm": 0.927923085075217,
"learning_rate": 1.3809848678570204e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20741838216781616,
"step": 2600,
"valid_targets_mean": 1499.1,
"valid_targets_min": 549
},
{
"epoch": 4.491379310344827,
"grad_norm": 0.6804876534067182,
"learning_rate": 1.3728151037979468e-05,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2584356665611267,
"step": 2605,
"valid_targets_mean": 3414.1,
"valid_targets_min": 343
},
{
"epoch": 4.5,
"grad_norm": 0.8331576647298734,
"learning_rate": 1.3646569301166177e-05,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19165021181106567,
"step": 2610,
"valid_targets_mean": 2333.8,
"valid_targets_min": 589
},
{
"epoch": 4.508620689655173,
"grad_norm": 0.8201431783332219,
"learning_rate": 1.3565104975760936e-05,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27077627182006836,
"step": 2615,
"valid_targets_mean": 2511.2,
"valid_targets_min": 511
},
{
"epoch": 4.517241379310345,
"grad_norm": 0.9034946742282952,
"learning_rate": 1.34837595672246e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28327399492263794,
"step": 2620,
"valid_targets_mean": 2170.9,
"valid_targets_min": 648
},
{
"epoch": 4.525862068965517,
"grad_norm": 0.7195977109229138,
"learning_rate": 1.3402534578820428e-05,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2510998547077179,
"step": 2625,
"valid_targets_mean": 2907.8,
"valid_targets_min": 762
},
{
"epoch": 4.5344827586206895,
"grad_norm": 0.7377623184998696,
"learning_rate": 1.3321431511586308e-05,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23612627387046814,
"step": 2630,
"valid_targets_mean": 2875.3,
"valid_targets_min": 848
},
{
"epoch": 4.543103448275862,
"grad_norm": 0.6492806402613284,
"learning_rate": 1.3240451864307048e-05,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24571189284324646,
"step": 2635,
"valid_targets_mean": 3630.4,
"valid_targets_min": 772
},
{
"epoch": 4.551724137931035,
"grad_norm": 0.8073728194218844,
"learning_rate": 1.3159597133486628e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24010978639125824,
"step": 2640,
"valid_targets_mean": 2459.0,
"valid_targets_min": 561
},
{
"epoch": 4.560344827586206,
"grad_norm": 0.7825834526443618,
"learning_rate": 1.3078868813320594e-05,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30113720893859863,
"step": 2645,
"valid_targets_mean": 2919.1,
"valid_targets_min": 970
},
{
"epoch": 4.568965517241379,
"grad_norm": 0.8053544868678272,
"learning_rate": 1.2998268395668412e-05,
"loss": 0.2767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2285986840724945,
"step": 2650,
"valid_targets_mean": 2252.1,
"valid_targets_min": 558
},
{
"epoch": 4.577586206896552,
"grad_norm": 0.7286795475876217,
"learning_rate": 1.2917797370025908e-05,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20709648728370667,
"step": 2655,
"valid_targets_mean": 2482.2,
"valid_targets_min": 768
},
{
"epoch": 4.586206896551724,
"grad_norm": 0.7980126972228626,
"learning_rate": 1.2837457223497754e-05,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2862476408481598,
"step": 2660,
"valid_targets_mean": 2788.4,
"valid_targets_min": 299
},
{
"epoch": 4.594827586206897,
"grad_norm": 0.9547103713318049,
"learning_rate": 1.2757249440769957e-05,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2612942159175873,
"step": 2665,
"valid_targets_mean": 2043.6,
"valid_targets_min": 495
},
{
"epoch": 4.603448275862069,
"grad_norm": 0.905981008508086,
"learning_rate": 1.2677175504082452e-05,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2664405107498169,
"step": 2670,
"valid_targets_mean": 2115.1,
"valid_targets_min": 574
},
{
"epoch": 4.612068965517241,
"grad_norm": 0.7140183681440331,
"learning_rate": 1.2597236893201712e-05,
"loss": 0.3195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34579741954803467,
"step": 2675,
"valid_targets_mean": 4065.8,
"valid_targets_min": 756
},
{
"epoch": 4.620689655172414,
"grad_norm": 0.6892440746656789,
"learning_rate": 1.2517435085393373e-05,
"loss": 0.2708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21152852475643158,
"step": 2680,
"valid_targets_mean": 3078.9,
"valid_targets_min": 684
},
{
"epoch": 4.629310344827586,
"grad_norm": 0.8486268587233803,
"learning_rate": 1.2437771555394944e-05,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2553647756576538,
"step": 2685,
"valid_targets_mean": 2060.7,
"valid_targets_min": 870
},
{
"epoch": 4.637931034482759,
"grad_norm": 0.6729119974556853,
"learning_rate": 1.2358247775388578e-05,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.291421502828598,
"step": 2690,
"valid_targets_mean": 3406.8,
"valid_targets_min": 479
},
{
"epoch": 4.646551724137931,
"grad_norm": 0.9670461613890826,
"learning_rate": 1.227886521497383e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2571569085121155,
"step": 2695,
"valid_targets_mean": 1696.8,
"valid_targets_min": 561
},
{
"epoch": 4.655172413793103,
"grad_norm": 0.9756750116337135,
"learning_rate": 1.2199625341140533e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31376075744628906,
"step": 2700,
"valid_targets_mean": 2084.3,
"valid_targets_min": 737
},
{
"epoch": 4.663793103448276,
"grad_norm": 0.8118045075648823,
"learning_rate": 1.2120529618241665e-05,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2494584619998932,
"step": 2705,
"valid_targets_mean": 2730.1,
"valid_targets_min": 644
},
{
"epoch": 4.672413793103448,
"grad_norm": 0.7694865435535756,
"learning_rate": 1.2041579507966288e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23829087615013123,
"step": 2710,
"valid_targets_mean": 2551.9,
"valid_targets_min": 838
},
{
"epoch": 4.681034482758621,
"grad_norm": 0.9076282780504955,
"learning_rate": 1.1962776469312556e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3020887076854706,
"step": 2715,
"valid_targets_mean": 2050.4,
"valid_targets_min": 798
},
{
"epoch": 4.689655172413794,
"grad_norm": 0.984237292189467,
"learning_rate": 1.1884121958560721e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2580467462539673,
"step": 2720,
"valid_targets_mean": 1632.6,
"valid_targets_min": 667
},
{
"epoch": 4.698275862068965,
"grad_norm": 0.8914302319151403,
"learning_rate": 1.1805617429246254e-05,
"loss": 0.3175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4029195308685303,
"step": 2725,
"valid_targets_mean": 2773.8,
"valid_targets_min": 468
},
{
"epoch": 4.706896551724138,
"grad_norm": 0.8839779314527022,
"learning_rate": 1.1727264332132978e-05,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26910024881362915,
"step": 2730,
"valid_targets_mean": 2261.6,
"valid_targets_min": 653
},
{
"epoch": 4.7155172413793105,
"grad_norm": 0.8225743421333721,
"learning_rate": 1.1649064115186216e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.270842969417572,
"step": 2735,
"valid_targets_mean": 2445.1,
"valid_targets_min": 581
},
{
"epoch": 4.724137931034483,
"grad_norm": 0.8877295961730737,
"learning_rate": 1.1571018223546095e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2545921802520752,
"step": 2740,
"valid_targets_mean": 2293.9,
"valid_targets_min": 733
},
{
"epoch": 4.732758620689655,
"grad_norm": 0.9014458800755352,
"learning_rate": 1.1493128099500806e-05,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19791623950004578,
"step": 2745,
"valid_targets_mean": 2367.0,
"valid_targets_min": 1119
},
{
"epoch": 4.741379310344827,
"grad_norm": 0.8402569938502772,
"learning_rate": 1.1415395182459925e-05,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3597656190395355,
"step": 2750,
"valid_targets_mean": 2686.0,
"valid_targets_min": 708
},
{
"epoch": 4.75,
"grad_norm": 0.7089169362206015,
"learning_rate": 1.1337820908927891e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29866451025009155,
"step": 2755,
"valid_targets_mean": 3162.3,
"valid_targets_min": 779
},
{
"epoch": 4.758620689655173,
"grad_norm": 0.9099687598408538,
"learning_rate": 1.126040671247738e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32522955536842346,
"step": 2760,
"valid_targets_mean": 2540.8,
"valid_targets_min": 487
},
{
"epoch": 4.767241379310345,
"grad_norm": 0.715299266743667,
"learning_rate": 1.1183154023722839e-05,
"loss": 0.3053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26378440856933594,
"step": 2765,
"valid_targets_mean": 3656.9,
"valid_targets_min": 714
},
{
"epoch": 4.775862068965517,
"grad_norm": 0.8044464553170273,
"learning_rate": 1.1106064270294068e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24478477239608765,
"step": 2770,
"valid_targets_mean": 2387.5,
"valid_targets_min": 708
},
{
"epoch": 4.7844827586206895,
"grad_norm": 0.8572643434070522,
"learning_rate": 1.1029138876809818e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2885858714580536,
"step": 2775,
"valid_targets_mean": 2269.8,
"valid_targets_min": 730
},
{
"epoch": 4.793103448275862,
"grad_norm": 0.8831366905295249,
"learning_rate": 1.0952379264851464e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25413423776626587,
"step": 2780,
"valid_targets_mean": 1837.9,
"valid_targets_min": 575
},
{
"epoch": 4.801724137931035,
"grad_norm": 0.7537924671729679,
"learning_rate": 1.087578685293674e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21763187646865845,
"step": 2785,
"valid_targets_mean": 2566.1,
"valid_targets_min": 627
},
{
"epoch": 4.810344827586206,
"grad_norm": 0.7703574579799106,
"learning_rate": 1.0799363056493529e-05,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20490054786205292,
"step": 2790,
"valid_targets_mean": 2255.1,
"valid_targets_min": 607
},
{
"epoch": 4.818965517241379,
"grad_norm": 0.8233927826656027,
"learning_rate": 1.0723109287833697e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2616879940032959,
"step": 2795,
"valid_targets_mean": 2616.1,
"valid_targets_min": 679
},
{
"epoch": 4.827586206896552,
"grad_norm": 0.8032320228650361,
"learning_rate": 1.0647026956126979e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26382285356521606,
"step": 2800,
"valid_targets_mean": 2502.1,
"valid_targets_min": 412
},
{
"epoch": 4.836206896551724,
"grad_norm": 0.6432642583887519,
"learning_rate": 1.0571117467374972e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29295748472213745,
"step": 2805,
"valid_targets_mean": 3958.2,
"valid_targets_min": 600
},
{
"epoch": 4.844827586206897,
"grad_norm": 0.8550150623571411,
"learning_rate": 1.0495382224385154e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27578306198120117,
"step": 2810,
"valid_targets_mean": 2180.1,
"valid_targets_min": 437
},
{
"epoch": 4.853448275862069,
"grad_norm": 0.8282277450172278,
"learning_rate": 1.0419822626744894e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23954559862613678,
"step": 2815,
"valid_targets_mean": 2158.8,
"valid_targets_min": 586
},
{
"epoch": 4.862068965517241,
"grad_norm": 0.739519390252053,
"learning_rate": 1.0344440070795671e-05,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24350044131278992,
"step": 2820,
"valid_targets_mean": 2944.4,
"valid_targets_min": 567
},
{
"epoch": 4.870689655172414,
"grad_norm": 0.6351145044807031,
"learning_rate": 1.0269235949607223e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.388615220785141,
"step": 2825,
"valid_targets_mean": 4205.4,
"valid_targets_min": 713
},
{
"epoch": 4.879310344827586,
"grad_norm": 0.9737679102183793,
"learning_rate": 1.019421165295182e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30197206139564514,
"step": 2830,
"valid_targets_mean": 1733.2,
"valid_targets_min": 787
},
{
"epoch": 4.887931034482759,
"grad_norm": 0.6615703692662012,
"learning_rate": 1.0119368567278545e-05,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22386646270751953,
"step": 2835,
"valid_targets_mean": 3164.2,
"valid_targets_min": 1170
},
{
"epoch": 4.896551724137931,
"grad_norm": 0.9421012456482122,
"learning_rate": 1.0044708075687746e-05,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27233490347862244,
"step": 2840,
"valid_targets_mean": 1674.3,
"valid_targets_min": 454
},
{
"epoch": 4.905172413793103,
"grad_norm": 0.6755294173673939,
"learning_rate": 9.97023155790541e-06,
"loss": 0.2975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.362407386302948,
"step": 2845,
"valid_targets_mean": 3552.1,
"valid_targets_min": 713
},
{
"epoch": 4.913793103448276,
"grad_norm": 0.7331491510364737,
"learning_rate": 9.895940390257675e-06,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2711232602596283,
"step": 2850,
"valid_targets_mean": 3487.1,
"valid_targets_min": 1102
},
{
"epoch": 4.922413793103448,
"grad_norm": 0.9290584095263694,
"learning_rate": 9.821835945645426e-06,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2613976001739502,
"step": 2855,
"valid_targets_mean": 1895.8,
"valid_targets_min": 546
},
{
"epoch": 4.931034482758621,
"grad_norm": 0.7712276355626331,
"learning_rate": 9.747919593518897e-06,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23783954977989197,
"step": 2860,
"valid_targets_mean": 2612.0,
"valid_targets_min": 1141
},
{
"epoch": 4.939655172413794,
"grad_norm": 0.915887245911443,
"learning_rate": 9.674192699852397e-06,
"loss": 0.3151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2635113000869751,
"step": 2865,
"valid_targets_mean": 2107.1,
"valid_targets_min": 431
},
{
"epoch": 4.948275862068965,
"grad_norm": 0.8107696850116063,
"learning_rate": 9.600656627119e-06,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25736725330352783,
"step": 2870,
"valid_targets_mean": 2507.6,
"valid_targets_min": 729
},
{
"epoch": 4.956896551724138,
"grad_norm": 0.8281895858985249,
"learning_rate": 9.52731273426544e-06,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27084803581237793,
"step": 2875,
"valid_targets_mean": 2390.9,
"valid_targets_min": 521
},
{
"epoch": 4.9655172413793105,
"grad_norm": 0.8513496909637406,
"learning_rate": 9.454162376686959e-06,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3300788998603821,
"step": 2880,
"valid_targets_mean": 2519.0,
"valid_targets_min": 531
},
{
"epoch": 4.974137931034483,
"grad_norm": 0.7655388287695867,
"learning_rate": 9.381206906202268e-06,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.245473712682724,
"step": 2885,
"valid_targets_mean": 2970.3,
"valid_targets_min": 452
},
{
"epoch": 4.982758620689655,
"grad_norm": 0.8822118338492542,
"learning_rate": 9.308447671028546e-06,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3259021043777466,
"step": 2890,
"valid_targets_mean": 2148.8,
"valid_targets_min": 566
},
{
"epoch": 4.991379310344827,
"grad_norm": 0.806073479088948,
"learning_rate": 9.235886015756579e-06,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2970079481601715,
"step": 2895,
"valid_targets_mean": 2542.0,
"valid_targets_min": 707
},
{
"epoch": 5.0,
"grad_norm": 0.7534412948501094,
"learning_rate": 9.163523281325855e-06,
"loss": 0.2606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1989104300737381,
"step": 2900,
"valid_targets_mean": 2618.3,
"valid_targets_min": 660
},
{
"epoch": 5.008620689655173,
"grad_norm": 1.105096861322533,
"learning_rate": 9.09136080499979e-06,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2033461630344391,
"step": 2905,
"valid_targets_mean": 2087.2,
"valid_targets_min": 621
},
{
"epoch": 5.017241379310345,
"grad_norm": 0.814355316956615,
"learning_rate": 9.019399920341056e-06,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2211400270462036,
"step": 2910,
"valid_targets_mean": 2302.2,
"valid_targets_min": 740
},
{
"epoch": 5.025862068965517,
"grad_norm": 0.7555369935442012,
"learning_rate": 8.947641957186901e-06,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22201001644134521,
"step": 2915,
"valid_targets_mean": 2680.2,
"valid_targets_min": 617
},
{
"epoch": 5.0344827586206895,
"grad_norm": 0.8780869760515323,
"learning_rate": 8.876088241624581e-06,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23922735452651978,
"step": 2920,
"valid_targets_mean": 2703.8,
"valid_targets_min": 727
},
{
"epoch": 5.043103448275862,
"grad_norm": 0.7990653658780432,
"learning_rate": 8.804740095966854e-06,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19045668840408325,
"step": 2925,
"valid_targets_mean": 2416.1,
"valid_targets_min": 580
},
{
"epoch": 5.051724137931035,
"grad_norm": 0.88230408527402,
"learning_rate": 8.733598838727559e-06,
"loss": 0.2794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37333962321281433,
"step": 2930,
"valid_targets_mean": 2585.8,
"valid_targets_min": 528
},
{
"epoch": 5.060344827586207,
"grad_norm": 0.6819112657231726,
"learning_rate": 8.662665784597229e-06,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23839415609836578,
"step": 2935,
"valid_targets_mean": 3358.6,
"valid_targets_min": 856
},
{
"epoch": 5.068965517241379,
"grad_norm": 0.8293484691002044,
"learning_rate": 8.591942244418787e-06,
"loss": 0.2198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19481952488422394,
"step": 2940,
"valid_targets_mean": 2366.5,
"valid_targets_min": 635
},
{
"epoch": 5.077586206896552,
"grad_norm": 0.7881892372101212,
"learning_rate": 8.521429525163353e-06,
"loss": 0.1996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24439600110054016,
"step": 2945,
"valid_targets_mean": 2869.0,
"valid_targets_min": 905
},
{
"epoch": 5.086206896551724,
"grad_norm": 0.8617105163860078,
"learning_rate": 8.451128929906103e-06,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24448537826538086,
"step": 2950,
"valid_targets_mean": 2538.8,
"valid_targets_min": 1034
},
{
"epoch": 5.094827586206897,
"grad_norm": 0.9667277337097181,
"learning_rate": 8.381041757802104e-06,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20713761448860168,
"step": 2955,
"valid_targets_mean": 1746.7,
"valid_targets_min": 454
},
{
"epoch": 5.103448275862069,
"grad_norm": 0.9687477914516257,
"learning_rate": 8.311169304062408e-06,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2437906712293625,
"step": 2960,
"valid_targets_mean": 2335.4,
"valid_targets_min": 716
},
{
"epoch": 5.112068965517241,
"grad_norm": 0.8722989954744373,
"learning_rate": 8.24151285993005e-06,
"loss": 0.2416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2599342167377472,
"step": 2965,
"valid_targets_mean": 2459.4,
"valid_targets_min": 864
},
{
"epoch": 5.120689655172414,
"grad_norm": 0.8167610619718768,
"learning_rate": 8.172073712656217e-06,
"loss": 0.2527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22704723477363586,
"step": 2970,
"valid_targets_mean": 2647.9,
"valid_targets_min": 409
},
{
"epoch": 5.129310344827586,
"grad_norm": 0.8851364961430449,
"learning_rate": 8.102853145476443e-06,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2630884647369385,
"step": 2975,
"valid_targets_mean": 1864.2,
"valid_targets_min": 753
},
{
"epoch": 5.137931034482759,
"grad_norm": 0.8571259105485494,
"learning_rate": 8.033852437586909e-06,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30201417207717896,
"step": 2980,
"valid_targets_mean": 2867.9,
"valid_targets_min": 675
},
{
"epoch": 5.146551724137931,
"grad_norm": 0.7274305622693614,
"learning_rate": 7.965072864120795e-06,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21190223097801208,
"step": 2985,
"valid_targets_mean": 3433.0,
"valid_targets_min": 862
},
{
"epoch": 5.155172413793103,
"grad_norm": 0.9890160470396074,
"learning_rate": 7.896515696124703e-06,
"loss": 0.2139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21601173281669617,
"step": 2990,
"valid_targets_mean": 1532.0,
"valid_targets_min": 461
},
{
"epoch": 5.163793103448276,
"grad_norm": 0.997039918531523,
"learning_rate": 7.828182200535192e-06,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23005810379981995,
"step": 2995,
"valid_targets_mean": 1639.2,
"valid_targets_min": 546
},
{
"epoch": 5.172413793103448,
"grad_norm": 0.6867188638921778,
"learning_rate": 7.760073640155363e-06,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2459755539894104,
"step": 3000,
"valid_targets_mean": 3401.4,
"valid_targets_min": 842
},
{
"epoch": 5.181034482758621,
"grad_norm": 0.6533351330245627,
"learning_rate": 7.6921912736315e-06,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.376540869474411,
"step": 3005,
"valid_targets_mean": 4465.1,
"valid_targets_min": 904
},
{
"epoch": 5.189655172413793,
"grad_norm": 0.8644740868223272,
"learning_rate": 7.624536355429832e-06,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22686511278152466,
"step": 3010,
"valid_targets_mean": 2452.3,
"valid_targets_min": 830
},
{
"epoch": 5.198275862068965,
"grad_norm": 0.7124035393064789,
"learning_rate": 7.557110135813341e-06,
"loss": 0.2495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3452039062976837,
"step": 3015,
"valid_targets_mean": 3736.2,
"valid_targets_min": 424
},
{
"epoch": 5.206896551724138,
"grad_norm": 0.7775149834470849,
"learning_rate": 7.489913860818662e-06,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.185041606426239,
"step": 3020,
"valid_targets_mean": 2617.4,
"valid_targets_min": 481
},
{
"epoch": 5.2155172413793105,
"grad_norm": 0.7965342418230602,
"learning_rate": 7.4229487722330315e-06,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30193090438842773,
"step": 3025,
"valid_targets_mean": 2663.9,
"valid_targets_min": 637
},
{
"epoch": 5.224137931034483,
"grad_norm": 0.7442252187409096,
"learning_rate": 7.356216107571399e-06,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.226355642080307,
"step": 3030,
"valid_targets_mean": 2999.0,
"valid_targets_min": 630
},
{
"epoch": 5.232758620689655,
"grad_norm": 0.8920967655645357,
"learning_rate": 7.289717100053497e-06,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.274308443069458,
"step": 3035,
"valid_targets_mean": 2436.9,
"valid_targets_min": 848
},
{
"epoch": 5.241379310344827,
"grad_norm": 0.80538672065562,
"learning_rate": 7.2234529785810645e-06,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25805386900901794,
"step": 3040,
"valid_targets_mean": 2757.7,
"valid_targets_min": 479
},
{
"epoch": 5.25,
"grad_norm": 0.9390707357590979,
"learning_rate": 7.157424967715163e-06,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23520056903362274,
"step": 3045,
"valid_targets_mean": 1874.8,
"valid_targets_min": 635
},
{
"epoch": 5.258620689655173,
"grad_norm": 0.928924497701895,
"learning_rate": 7.091634287653526e-06,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29944998025894165,
"step": 3050,
"valid_targets_mean": 2415.0,
"valid_targets_min": 643
},
{
"epoch": 5.267241379310345,
"grad_norm": 0.9511943447002247,
"learning_rate": 7.026082154208012e-06,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21823076903820038,
"step": 3055,
"valid_targets_mean": 2298.8,
"valid_targets_min": 543
},
{
"epoch": 5.275862068965517,
"grad_norm": 0.8603536556942801,
"learning_rate": 6.960769778782133e-06,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2770598232746124,
"step": 3060,
"valid_targets_mean": 2980.1,
"valid_targets_min": 978
},
{
"epoch": 5.2844827586206895,
"grad_norm": 0.8370012369788737,
"learning_rate": 6.89569836834868e-06,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24535402655601501,
"step": 3065,
"valid_targets_mean": 2859.5,
"valid_targets_min": 948
},
{
"epoch": 5.293103448275862,
"grad_norm": 0.7706085321244089,
"learning_rate": 6.830869125427406e-06,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22897306084632874,
"step": 3070,
"valid_targets_mean": 2896.3,
"valid_targets_min": 460
},
{
"epoch": 5.301724137931035,
"grad_norm": 0.9389137954620951,
"learning_rate": 6.766283248062817e-06,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2493031620979309,
"step": 3075,
"valid_targets_mean": 1989.4,
"valid_targets_min": 569
},
{
"epoch": 5.310344827586207,
"grad_norm": 0.99461767506957,
"learning_rate": 6.701941929801996e-06,
"loss": 0.2394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2475142478942871,
"step": 3080,
"valid_targets_mean": 1796.1,
"valid_targets_min": 507
},
{
"epoch": 5.318965517241379,
"grad_norm": 0.8124459132077362,
"learning_rate": 6.637846359672611e-06,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2720719277858734,
"step": 3085,
"valid_targets_mean": 3237.2,
"valid_targets_min": 714
},
{
"epoch": 5.327586206896552,
"grad_norm": 0.8142226470682105,
"learning_rate": 6.57399772216089e-06,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31625697016716003,
"step": 3090,
"valid_targets_mean": 2509.7,
"valid_targets_min": 665
},
{
"epoch": 5.336206896551724,
"grad_norm": 0.9065141934251587,
"learning_rate": 6.510397197189724e-06,
"loss": 0.2464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21385717391967773,
"step": 3095,
"valid_targets_mean": 1814.4,
"valid_targets_min": 604
},
{
"epoch": 5.344827586206897,
"grad_norm": 0.7442529504808642,
"learning_rate": 6.447045960096909e-06,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17409583926200867,
"step": 3100,
"valid_targets_mean": 2769.3,
"valid_targets_min": 721
},
{
"epoch": 5.353448275862069,
"grad_norm": 0.7252146553291541,
"learning_rate": 6.383945181613398e-06,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2682117819786072,
"step": 3105,
"valid_targets_mean": 3152.5,
"valid_targets_min": 779
},
{
"epoch": 5.362068965517241,
"grad_norm": 0.8114618415473984,
"learning_rate": 6.32109602784166e-06,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23913054168224335,
"step": 3110,
"valid_targets_mean": 2647.9,
"valid_targets_min": 442
},
{
"epoch": 5.370689655172414,
"grad_norm": 1.051915605302084,
"learning_rate": 6.258499660234147e-06,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22146379947662354,
"step": 3115,
"valid_targets_mean": 1598.4,
"valid_targets_min": 239
},
{
"epoch": 5.379310344827586,
"grad_norm": 0.8789321218372114,
"learning_rate": 6.196157235571813e-06,
"loss": 0.2708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3028132915496826,
"step": 3120,
"valid_targets_mean": 2299.0,
"valid_targets_min": 636
},
{
"epoch": 5.387931034482759,
"grad_norm": 0.9372581236618194,
"learning_rate": 6.134069905942764e-06,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2093108743429184,
"step": 3125,
"valid_targets_mean": 2376.3,
"valid_targets_min": 920
},
{
"epoch": 5.396551724137931,
"grad_norm": 0.9140188518901189,
"learning_rate": 6.072238818720919e-06,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2532634735107422,
"step": 3130,
"valid_targets_mean": 2265.4,
"valid_targets_min": 697
},
{
"epoch": 5.405172413793103,
"grad_norm": 0.7513197162873506,
"learning_rate": 6.010665116544858e-06,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2515407204627991,
"step": 3135,
"valid_targets_mean": 3497.4,
"valid_targets_min": 925
},
{
"epoch": 5.413793103448276,
"grad_norm": 0.801555947638085,
"learning_rate": 5.9493499372967e-06,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2099888026714325,
"step": 3140,
"valid_targets_mean": 2794.4,
"valid_targets_min": 607
},
{
"epoch": 5.422413793103448,
"grad_norm": 0.9269899206555638,
"learning_rate": 5.888294414081024e-06,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2532302141189575,
"step": 3145,
"valid_targets_mean": 1913.5,
"valid_targets_min": 430
},
{
"epoch": 5.431034482758621,
"grad_norm": 0.8973198139466191,
"learning_rate": 5.827499675203987e-06,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2676059603691101,
"step": 3150,
"valid_targets_mean": 2549.4,
"valid_targets_min": 463
},
{
"epoch": 5.439655172413793,
"grad_norm": 0.7944238364352102,
"learning_rate": 5.76696684415245e-06,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19005446135997772,
"step": 3155,
"valid_targets_mean": 2430.8,
"valid_targets_min": 556
},
{
"epoch": 5.448275862068965,
"grad_norm": 0.8242952463372876,
"learning_rate": 5.706697039573217e-06,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2020699828863144,
"step": 3160,
"valid_targets_mean": 2030.1,
"valid_targets_min": 462
},
{
"epoch": 5.456896551724138,
"grad_norm": 0.8901005474674238,
"learning_rate": 5.646691375252344e-06,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2569023072719574,
"step": 3165,
"valid_targets_mean": 2169.4,
"valid_targets_min": 646
},
{
"epoch": 5.4655172413793105,
"grad_norm": 0.736018639158119,
"learning_rate": 5.586950960094606e-06,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18459513783454895,
"step": 3170,
"valid_targets_mean": 2561.8,
"valid_targets_min": 749
},
{
"epoch": 5.474137931034483,
"grad_norm": 0.8400494581096617,
"learning_rate": 5.527476898102959e-06,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21703600883483887,
"step": 3175,
"valid_targets_mean": 2296.8,
"valid_targets_min": 600
},
{
"epoch": 5.482758620689655,
"grad_norm": 0.8209437576909444,
"learning_rate": 5.4682702883581395e-06,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2574310600757599,
"step": 3180,
"valid_targets_mean": 2344.2,
"valid_targets_min": 690
},
{
"epoch": 5.491379310344827,
"grad_norm": 0.8182704176506642,
"learning_rate": 5.40933222499838e-06,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.275604784488678,
"step": 3185,
"valid_targets_mean": 2814.9,
"valid_targets_min": 606
},
{
"epoch": 5.5,
"grad_norm": 0.8414281728930835,
"learning_rate": 5.350663797199174e-06,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21224384009838104,
"step": 3190,
"valid_targets_mean": 2361.4,
"valid_targets_min": 749
},
{
"epoch": 5.508620689655173,
"grad_norm": 0.7787724276238028,
"learning_rate": 5.292266089153149e-06,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23665933310985565,
"step": 3195,
"valid_targets_mean": 3440.9,
"valid_targets_min": 986
},
{
"epoch": 5.517241379310345,
"grad_norm": 0.9139485332508287,
"learning_rate": 5.234140180050029e-06,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.272885262966156,
"step": 3200,
"valid_targets_mean": 2132.9,
"valid_targets_min": 729
},
{
"epoch": 5.525862068965517,
"grad_norm": 0.6681187838459355,
"learning_rate": 5.1762871440566935e-06,
"loss": 0.2455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27599036693573,
"step": 3205,
"valid_targets_mean": 3626.7,
"valid_targets_min": 870
},
{
"epoch": 5.5344827586206895,
"grad_norm": 0.719024227101147,
"learning_rate": 5.118708050297332e-06,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3196202218532562,
"step": 3210,
"valid_targets_mean": 3611.8,
"valid_targets_min": 543
},
{
"epoch": 5.543103448275862,
"grad_norm": 0.73712058796339,
"learning_rate": 5.061403962833669e-06,
"loss": 0.247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4145488142967224,
"step": 3215,
"valid_targets_mean": 3701.7,
"valid_targets_min": 580
},
{
"epoch": 5.551724137931035,
"grad_norm": 0.8563148070230047,
"learning_rate": 5.004375940645314e-06,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2751157283782959,
"step": 3220,
"valid_targets_mean": 2403.4,
"valid_targets_min": 648
},
{
"epoch": 5.560344827586206,
"grad_norm": 0.7955026427941279,
"learning_rate": 4.947625037610219e-06,
"loss": 0.2172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20612727105617523,
"step": 3225,
"valid_targets_mean": 2537.2,
"valid_targets_min": 549
},
{
"epoch": 5.568965517241379,
"grad_norm": 0.9987730788341107,
"learning_rate": 4.8911523024851295e-06,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2039443701505661,
"step": 3230,
"valid_targets_mean": 1640.1,
"valid_targets_min": 549
},
{
"epoch": 5.577586206896552,
"grad_norm": 0.8832700315040387,
"learning_rate": 4.834958778886271e-06,
"loss": 0.2305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25076743960380554,
"step": 3235,
"valid_targets_mean": 2207.8,
"valid_targets_min": 538
},
{
"epoch": 5.586206896551724,
"grad_norm": 0.9542645205391439,
"learning_rate": 4.779045505270043e-06,
"loss": 0.2435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26392078399658203,
"step": 3240,
"valid_targets_mean": 1774.3,
"valid_targets_min": 676
},
{
"epoch": 5.594827586206897,
"grad_norm": 0.7567347660293566,
"learning_rate": 4.723413514913817e-06,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2786219120025635,
"step": 3245,
"valid_targets_mean": 3309.2,
"valid_targets_min": 462
},
{
"epoch": 5.603448275862069,
"grad_norm": 0.6792209326601717,
"learning_rate": 4.66806383589685e-06,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.270943820476532,
"step": 3250,
"valid_targets_mean": 3717.2,
"valid_targets_min": 911
},
{
"epoch": 5.612068965517241,
"grad_norm": 0.7857291734419023,
"learning_rate": 4.6129974910812855e-06,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24094904959201813,
"step": 3255,
"valid_targets_mean": 2995.2,
"valid_targets_min": 644
},
{
"epoch": 5.620689655172414,
"grad_norm": 1.0235608686110846,
"learning_rate": 4.558215498093252e-06,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3251035213470459,
"step": 3260,
"valid_targets_mean": 1856.7,
"valid_targets_min": 662
},
{
"epoch": 5.629310344827586,
"grad_norm": 0.9351963793116751,
"learning_rate": 4.503718869304063e-06,
"loss": 0.2408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23973754048347473,
"step": 3265,
"valid_targets_mean": 2018.8,
"valid_targets_min": 616
},
{
"epoch": 5.637931034482759,
"grad_norm": 0.962954318386746,
"learning_rate": 4.449508611811482e-06,
"loss": 0.3139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40691524744033813,
"step": 3270,
"valid_targets_mean": 2582.0,
"valid_targets_min": 398
},
{
"epoch": 5.646551724137931,
"grad_norm": 0.8172013834884642,
"learning_rate": 4.395585727421139e-06,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3875260353088379,
"step": 3275,
"valid_targets_mean": 2692.9,
"valid_targets_min": 504
},
{
"epoch": 5.655172413793103,
"grad_norm": 0.8610903423900477,
"learning_rate": 4.341951212628031e-06,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21040914952754974,
"step": 3280,
"valid_targets_mean": 2062.4,
"valid_targets_min": 611
},
{
"epoch": 5.663793103448276,
"grad_norm": 1.0523753196953791,
"learning_rate": 4.288606058598048e-06,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23646166920661926,
"step": 3285,
"valid_targets_mean": 2081.1,
"valid_targets_min": 617
},
{
"epoch": 5.672413793103448,
"grad_norm": 0.843692978853644,
"learning_rate": 4.235551251149714e-06,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20414787530899048,
"step": 3290,
"valid_targets_mean": 2991.9,
"valid_targets_min": 790
},
{
"epoch": 5.681034482758621,
"grad_norm": 0.8451079144051367,
"learning_rate": 4.1827877707359474e-06,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31735336780548096,
"step": 3295,
"valid_targets_mean": 3041.9,
"valid_targets_min": 707
},
{
"epoch": 5.689655172413794,
"grad_norm": 0.8078901356285255,
"learning_rate": 4.130316592425934e-06,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23267899453639984,
"step": 3300,
"valid_targets_mean": 2777.6,
"valid_targets_min": 654
},
{
"epoch": 5.698275862068965,
"grad_norm": 0.8571064223274443,
"learning_rate": 4.078138685887125e-06,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22103667259216309,
"step": 3305,
"valid_targets_mean": 2645.8,
"valid_targets_min": 448
},
{
"epoch": 5.706896551724138,
"grad_norm": 0.8230034928760354,
"learning_rate": 4.026255015367302e-06,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21825623512268066,
"step": 3310,
"valid_targets_mean": 2551.1,
"valid_targets_min": 343
},
{
"epoch": 5.7155172413793105,
"grad_norm": 1.0239665276979915,
"learning_rate": 3.974666539676774e-06,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24945151805877686,
"step": 3315,
"valid_targets_mean": 1659.0,
"valid_targets_min": 526
},
{
"epoch": 5.724137931034483,
"grad_norm": 1.0776616704513493,
"learning_rate": 3.923374212170634e-06,
"loss": 0.2431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2398718148469925,
"step": 3320,
"valid_targets_mean": 1804.1,
"valid_targets_min": 599
},
{
"epoch": 5.732758620689655,
"grad_norm": 1.016789683397506,
"learning_rate": 3.872378980731168e-06,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22868318855762482,
"step": 3325,
"valid_targets_mean": 1696.4,
"valid_targets_min": 365
},
{
"epoch": 5.741379310344827,
"grad_norm": 0.822562726856188,
"learning_rate": 3.821681787750327e-06,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.319583535194397,
"step": 3330,
"valid_targets_mean": 2791.6,
"valid_targets_min": 561
},
{
"epoch": 5.75,
"grad_norm": 0.8374432974605485,
"learning_rate": 3.7712835701122985e-06,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27780675888061523,
"step": 3335,
"valid_targets_mean": 2587.7,
"valid_targets_min": 584
},
{
"epoch": 5.758620689655173,
"grad_norm": 0.8238659716528866,
"learning_rate": 3.721185259176223e-06,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24886605143547058,
"step": 3340,
"valid_targets_mean": 2995.2,
"valid_targets_min": 758
},
{
"epoch": 5.767241379310345,
"grad_norm": 0.9083332235947693,
"learning_rate": 3.6713877807589503e-06,
"loss": 0.2406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25362688302993774,
"step": 3345,
"valid_targets_mean": 2286.2,
"valid_targets_min": 578
},
{
"epoch": 5.775862068965517,
"grad_norm": 0.7791354120068396,
"learning_rate": 3.621892055117955e-06,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2154545933008194,
"step": 3350,
"valid_targets_mean": 2828.0,
"valid_targets_min": 664
},
{
"epoch": 5.7844827586206895,
"grad_norm": 0.7390189719309704,
"learning_rate": 3.572698996934303e-06,
"loss": 0.2559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2241281419992447,
"step": 3355,
"valid_targets_mean": 3631.4,
"valid_targets_min": 871
},
{
"epoch": 5.793103448275862,
"grad_norm": 0.8756183555419305,
"learning_rate": 3.5238095152957906e-06,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29824498295783997,
"step": 3360,
"valid_targets_mean": 2598.0,
"valid_targets_min": 495
},
{
"epoch": 5.801724137931035,
"grad_norm": 0.9337227488178528,
"learning_rate": 3.4752245136801065e-06,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24506528675556183,
"step": 3365,
"valid_targets_mean": 2258.9,
"valid_targets_min": 878
},
{
"epoch": 5.810344827586206,
"grad_norm": 1.0890649426704166,
"learning_rate": 3.4269448899381354e-06,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2098155915737152,
"step": 3370,
"valid_targets_mean": 2132.2,
"valid_targets_min": 837
},
{
"epoch": 5.818965517241379,
"grad_norm": 0.9953523310912673,
"learning_rate": 3.3789715362773955e-06,
"loss": 0.2209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24397800862789154,
"step": 3375,
"valid_targets_mean": 1919.3,
"valid_targets_min": 752
},
{
"epoch": 5.827586206896552,
"grad_norm": 0.9040669773305245,
"learning_rate": 3.3313053392455317e-06,
"loss": 0.2409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2670442461967468,
"step": 3380,
"valid_targets_mean": 2793.4,
"valid_targets_min": 854
},
{
"epoch": 5.836206896551724,
"grad_norm": 0.8329381538145997,
"learning_rate": 3.2839471797139287e-06,
"loss": 0.2342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24865490198135376,
"step": 3385,
"valid_targets_mean": 3038.6,
"valid_targets_min": 734
},
{
"epoch": 5.844827586206897,
"grad_norm": 0.9337244826069802,
"learning_rate": 3.236897932861438e-06,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2127501517534256,
"step": 3390,
"valid_targets_mean": 1871.8,
"valid_targets_min": 389
},
{
"epoch": 5.853448275862069,
"grad_norm": 0.7431219731060789,
"learning_rate": 3.190158468158209e-06,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20985054969787598,
"step": 3395,
"valid_targets_mean": 3339.9,
"valid_targets_min": 572
},
{
"epoch": 5.862068965517241,
"grad_norm": 0.7365106247265166,
"learning_rate": 3.1437296493496183e-06,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18149128556251526,
"step": 3400,
"valid_targets_mean": 2524.5,
"valid_targets_min": 531
},
{
"epoch": 5.870689655172414,
"grad_norm": 0.7285497403315008,
"learning_rate": 3.0976123344402897e-06,
"loss": 0.2312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19571764767169952,
"step": 3405,
"valid_targets_mean": 2929.2,
"valid_targets_min": 1012
},
{
"epoch": 5.879310344827586,
"grad_norm": 0.8446091784157775,
"learning_rate": 3.0518073756782683e-06,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21701383590698242,
"step": 3410,
"valid_targets_mean": 2557.4,
"valid_targets_min": 668
},
{
"epoch": 5.887931034482759,
"grad_norm": 0.8379682725324452,
"learning_rate": 3.0063156195392685e-06,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22046051919460297,
"step": 3415,
"valid_targets_mean": 2508.8,
"valid_targets_min": 1004
},
{
"epoch": 5.896551724137931,
"grad_norm": 0.823916206620456,
"learning_rate": 2.9611379067109914e-06,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25937724113464355,
"step": 3420,
"valid_targets_mean": 2341.8,
"valid_targets_min": 603
},
{
"epoch": 5.905172413793103,
"grad_norm": 0.8688927625576043,
"learning_rate": 2.9162750720776366e-06,
"loss": 0.2338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20510298013687134,
"step": 3425,
"valid_targets_mean": 2424.8,
"valid_targets_min": 684
},
{
"epoch": 5.913793103448276,
"grad_norm": 0.8413675713303786,
"learning_rate": 2.871727944704452e-06,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2330384999513626,
"step": 3430,
"valid_targets_mean": 2494.5,
"valid_targets_min": 707
},
{
"epoch": 5.922413793103448,
"grad_norm": 0.8731479034508837,
"learning_rate": 2.8274973478224167e-06,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21474598348140717,
"step": 3435,
"valid_targets_mean": 1941.6,
"valid_targets_min": 743
},
{
"epoch": 5.931034482758621,
"grad_norm": 0.7949398908604771,
"learning_rate": 2.783584098813006e-06,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21405553817749023,
"step": 3440,
"valid_targets_mean": 2754.8,
"valid_targets_min": 1074
},
{
"epoch": 5.939655172413794,
"grad_norm": 0.6099875987527934,
"learning_rate": 2.739989009193138e-06,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19622787833213806,
"step": 3445,
"valid_targets_mean": 3920.4,
"valid_targets_min": 737
},
{
"epoch": 5.948275862068965,
"grad_norm": 0.8887479983547679,
"learning_rate": 2.6967128846001234e-06,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22184374928474426,
"step": 3450,
"valid_targets_mean": 2611.6,
"valid_targets_min": 678
},
{
"epoch": 5.956896551724138,
"grad_norm": 0.762426985169917,
"learning_rate": 2.6537565247768094e-06,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22541582584381104,
"step": 3455,
"valid_targets_mean": 2869.6,
"valid_targets_min": 607
},
{
"epoch": 5.9655172413793105,
"grad_norm": 0.7213697453294076,
"learning_rate": 2.611120723556775e-06,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19540910422801971,
"step": 3460,
"valid_targets_mean": 3429.9,
"valid_targets_min": 474
},
{
"epoch": 5.974137931034483,
"grad_norm": 0.8288431420947139,
"learning_rate": 2.568806268849684e-06,
"loss": 0.27,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3504294455051422,
"step": 3465,
"valid_targets_mean": 3034.3,
"valid_targets_min": 497
},
{
"epoch": 5.982758620689655,
"grad_norm": 0.8835454906756263,
"learning_rate": 2.526813942626736e-06,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22182214260101318,
"step": 3470,
"valid_targets_mean": 2302.6,
"valid_targets_min": 437
},
{
"epoch": 5.991379310344827,
"grad_norm": 0.971771312176322,
"learning_rate": 2.4851445209061574e-06,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23820282518863678,
"step": 3475,
"valid_targets_mean": 2441.9,
"valid_targets_min": 689
},
{
"epoch": 6.0,
"grad_norm": 0.9859173949074006,
"learning_rate": 2.4437987737389277e-06,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3061915636062622,
"step": 3480,
"valid_targets_mean": 1670.5,
"valid_targets_min": 521
},
{
"epoch": 6.008620689655173,
"grad_norm": 0.8259796364563601,
"learning_rate": 2.40277746519451e-06,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2662147283554077,
"step": 3485,
"valid_targets_mean": 2172.5,
"valid_targets_min": 967
},
{
"epoch": 6.017241379310345,
"grad_norm": 0.8122390172067061,
"learning_rate": 2.362081353346746e-06,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3083020746707916,
"step": 3490,
"valid_targets_mean": 2627.9,
"valid_targets_min": 651
},
{
"epoch": 6.025862068965517,
"grad_norm": 0.8572002021748207,
"learning_rate": 2.3217111902598298e-06,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1962701827287674,
"step": 3495,
"valid_targets_mean": 2450.2,
"valid_targets_min": 786
},
{
"epoch": 6.0344827586206895,
"grad_norm": 0.7183758223798724,
"learning_rate": 2.2816677219744388e-06,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1775016337633133,
"step": 3500,
"valid_targets_mean": 3416.1,
"valid_targets_min": 425
},
{
"epoch": 6.043103448275862,
"grad_norm": 0.8569666247164796,
"learning_rate": 2.241951688493924e-06,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2090853452682495,
"step": 3505,
"valid_targets_mean": 2665.7,
"valid_targets_min": 937
},
{
"epoch": 6.051724137931035,
"grad_norm": 0.7083072713399716,
"learning_rate": 2.2025638237706294e-06,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21648496389389038,
"step": 3510,
"valid_targets_mean": 3468.3,
"valid_targets_min": 595
},
{
"epoch": 6.060344827586207,
"grad_norm": 0.7616299153165997,
"learning_rate": 2.1635048556923555e-06,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3211386799812317,
"step": 3515,
"valid_targets_mean": 3530.7,
"valid_targets_min": 725
},
{
"epoch": 6.068965517241379,
"grad_norm": 0.8144597761169627,
"learning_rate": 2.1247755060688856e-06,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2765442728996277,
"step": 3520,
"valid_targets_mean": 2601.8,
"valid_targets_min": 620
},
{
"epoch": 6.077586206896552,
"grad_norm": 0.8808259389489778,
"learning_rate": 2.0863764906186514e-06,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18842661380767822,
"step": 3525,
"valid_targets_mean": 2145.4,
"valid_targets_min": 663
},
{
"epoch": 6.086206896551724,
"grad_norm": 0.7029072678359862,
"learning_rate": 2.048308518955515e-06,
"loss": 0.2031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.236032634973526,
"step": 3530,
"valid_targets_mean": 2771.7,
"valid_targets_min": 668
},
{
"epoch": 6.094827586206897,
"grad_norm": 0.9491045420303452,
"learning_rate": 2.010572294575641e-06,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2161491960287094,
"step": 3535,
"valid_targets_mean": 2009.6,
"valid_targets_min": 633
},
{
"epoch": 6.103448275862069,
"grad_norm": 0.6859005396721884,
"learning_rate": 1.9731685148445168e-06,
"loss": 0.2792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22911563515663147,
"step": 3540,
"valid_targets_mean": 3666.6,
"valid_targets_min": 524
},
{
"epoch": 6.112068965517241,
"grad_norm": 0.9557415355225928,
"learning_rate": 1.9360978709840304e-06,
"loss": 0.2133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21899035573005676,
"step": 3545,
"valid_targets_mean": 1906.8,
"valid_targets_min": 468
},
{
"epoch": 6.120689655172414,
"grad_norm": 0.909071489081533,
"learning_rate": 1.8993610480597359e-06,
"loss": 0.2409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24376355111598969,
"step": 3550,
"valid_targets_mean": 2097.9,
"valid_targets_min": 523
},
{
"epoch": 6.129310344827586,
"grad_norm": 0.8247316406377753,
"learning_rate": 1.8629587249681802e-06,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19326910376548767,
"step": 3555,
"valid_targets_mean": 2371.6,
"valid_targets_min": 647
},
{
"epoch": 6.137931034482759,
"grad_norm": 0.7254426351650269,
"learning_rate": 1.8268915744243321e-06,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21975982189178467,
"step": 3560,
"valid_targets_mean": 2966.4,
"valid_targets_min": 645
},
{
"epoch": 6.146551724137931,
"grad_norm": 0.9361941902410946,
"learning_rate": 1.7911602629491876e-06,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2509339451789856,
"step": 3565,
"valid_targets_mean": 1950.9,
"valid_targets_min": 390
},
{
"epoch": 6.155172413793103,
"grad_norm": 0.7228613254495483,
"learning_rate": 1.7557654508574339e-06,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20333698391914368,
"step": 3570,
"valid_targets_mean": 3122.8,
"valid_targets_min": 754
},
{
"epoch": 6.163793103448276,
"grad_norm": 1.0020794026321742,
"learning_rate": 1.7207077922452465e-06,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.210041344165802,
"step": 3575,
"valid_targets_mean": 2465.9,
"valid_targets_min": 549
},
{
"epoch": 6.172413793103448,
"grad_norm": 0.8798123178752363,
"learning_rate": 1.6859879349782016e-06,
"loss": 0.2092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18440866470336914,
"step": 3580,
"valid_targets_mean": 2341.3,
"valid_targets_min": 449
},
{
"epoch": 6.181034482758621,
"grad_norm": 0.8483923006765547,
"learning_rate": 1.6516065206793142e-06,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22888490557670593,
"step": 3585,
"valid_targets_mean": 2786.9,
"valid_targets_min": 670
},
{
"epoch": 6.189655172413793,
"grad_norm": 0.6647533942461221,
"learning_rate": 1.6175641847171687e-06,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13367384672164917,
"step": 3590,
"valid_targets_mean": 2980.8,
"valid_targets_min": 528
},
{
"epoch": 6.198275862068965,
"grad_norm": 0.7683054390842444,
"learning_rate": 1.5838615561941705e-06,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20049786567687988,
"step": 3595,
"valid_targets_mean": 3060.6,
"valid_targets_min": 651
},
{
"epoch": 6.206896551724138,
"grad_norm": 0.7673616808413553,
"learning_rate": 1.550499257934952e-06,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25009968876838684,
"step": 3600,
"valid_targets_mean": 2919.8,
"valid_targets_min": 1283
},
{
"epoch": 6.2155172413793105,
"grad_norm": 0.9320141925380155,
"learning_rate": 1.5174779064748246e-06,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25595584511756897,
"step": 3605,
"valid_targets_mean": 2494.9,
"valid_targets_min": 528
},
{
"epoch": 6.224137931034483,
"grad_norm": 0.793005521065028,
"learning_rate": 1.4847981120484089e-06,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2183004915714264,
"step": 3610,
"valid_targets_mean": 2551.4,
"valid_targets_min": 675
},
{
"epoch": 6.232758620689655,
"grad_norm": 0.984122982728532,
"learning_rate": 1.4524604785783548e-06,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24975597858428955,
"step": 3615,
"valid_targets_mean": 2036.0,
"valid_targets_min": 616
},
{
"epoch": 6.241379310344827,
"grad_norm": 1.0714043895025145,
"learning_rate": 1.4204656036641717e-06,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23043999075889587,
"step": 3620,
"valid_targets_mean": 1476.6,
"valid_targets_min": 511
},
{
"epoch": 6.25,
"grad_norm": 0.7599854368014449,
"learning_rate": 1.3888140785711945e-06,
"loss": 0.2274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2328336238861084,
"step": 3625,
"valid_targets_mean": 2807.8,
"valid_targets_min": 568
},
{
"epoch": 6.258620689655173,
"grad_norm": 0.7886353552490163,
"learning_rate": 1.3575064882196398e-06,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25991952419281006,
"step": 3630,
"valid_targets_mean": 2783.3,
"valid_targets_min": 662
},
{
"epoch": 6.267241379310345,
"grad_norm": 0.8249182347946712,
"learning_rate": 1.326543411173833e-06,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4094190299510956,
"step": 3635,
"valid_targets_mean": 2826.6,
"valid_targets_min": 797
},
{
"epoch": 6.275862068965517,
"grad_norm": 0.8263338135104763,
"learning_rate": 1.295925419631474e-06,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25934290885925293,
"step": 3640,
"valid_targets_mean": 2836.1,
"valid_targets_min": 1184
},
{
"epoch": 6.2844827586206895,
"grad_norm": 0.8722859174332926,
"learning_rate": 1.265653079413094e-06,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21666531264781952,
"step": 3645,
"valid_targets_mean": 2185.1,
"valid_targets_min": 860
},
{
"epoch": 6.293103448275862,
"grad_norm": 0.7035939411346323,
"learning_rate": 1.2357269499515745e-06,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17183193564414978,
"step": 3650,
"valid_targets_mean": 2954.5,
"valid_targets_min": 583
},
{
"epoch": 6.301724137931035,
"grad_norm": 0.8560939981440374,
"learning_rate": 1.2061475842818337e-06,
"loss": 0.1923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16396474838256836,
"step": 3655,
"valid_targets_mean": 2264.4,
"valid_targets_min": 546
},
{
"epoch": 6.310344827586207,
"grad_norm": 0.8276157933772642,
"learning_rate": 1.176915529030589e-06,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20803743600845337,
"step": 3660,
"valid_targets_mean": 2581.9,
"valid_targets_min": 631
},
{
"epoch": 6.318965517241379,
"grad_norm": 0.8825248792003373,
"learning_rate": 1.1480313244062603e-06,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19510574638843536,
"step": 3665,
"valid_targets_mean": 2983.0,
"valid_targets_min": 549
},
{
"epoch": 6.327586206896552,
"grad_norm": 1.0603206638893432,
"learning_rate": 1.1194955041889898e-06,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4232352674007416,
"step": 3670,
"valid_targets_mean": 2577.1,
"valid_targets_min": 659
},
{
"epoch": 6.336206896551724,
"grad_norm": 0.654952681959888,
"learning_rate": 1.0913085957207748e-06,
"loss": 0.2437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16756662726402283,
"step": 3675,
"valid_targets_mean": 3552.1,
"valid_targets_min": 661
},
{
"epoch": 6.344827586206897,
"grad_norm": 0.7777566470051069,
"learning_rate": 1.063471119895727e-06,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24378885328769684,
"step": 3680,
"valid_targets_mean": 2565.6,
"valid_targets_min": 809
},
{
"epoch": 6.353448275862069,
"grad_norm": 0.8061803441107526,
"learning_rate": 1.0359835911504246e-06,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18783554434776306,
"step": 3685,
"valid_targets_mean": 2660.6,
"valid_targets_min": 625
},
{
"epoch": 6.362068965517241,
"grad_norm": 0.902717438655001,
"learning_rate": 1.0088465174544514e-06,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22732427716255188,
"step": 3690,
"valid_targets_mean": 2514.8,
"valid_targets_min": 676
},
{
"epoch": 6.370689655172414,
"grad_norm": 0.8330379786967017,
"learning_rate": 9.820604003009614e-07,
"loss": 0.2394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19690130650997162,
"step": 3695,
"valid_targets_mean": 2417.4,
"valid_targets_min": 721
},
{
"epoch": 6.379310344827586,
"grad_norm": 0.8657508340163629,
"learning_rate": 9.556257346974319e-07,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20571178197860718,
"step": 3700,
"valid_targets_mean": 2392.0,
"valid_targets_min": 980
},
{
"epoch": 6.387931034482759,
"grad_norm": 0.9078987585519426,
"learning_rate": 9.295430091565261e-07,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16755205392837524,
"step": 3705,
"valid_targets_mean": 2038.2,
"valid_targets_min": 583
},
{
"epoch": 6.396551724137931,
"grad_norm": 0.6660952264268134,
"learning_rate": 9.038127056870416e-07,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19638925790786743,
"step": 3710,
"valid_targets_mean": 3692.2,
"valid_targets_min": 600
},
{
"epoch": 6.405172413793103,
"grad_norm": 0.6483874159711565,
"learning_rate": 8.784352997850277e-07,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2156984508037567,
"step": 3715,
"valid_targets_mean": 3738.2,
"valid_targets_min": 352
},
{
"epoch": 6.413793103448276,
"grad_norm": 1.1860093859601488,
"learning_rate": 8.534112604249789e-07,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21328943967819214,
"step": 3720,
"valid_targets_mean": 1351.2,
"valid_targets_min": 498
},
{
"epoch": 6.422413793103448,
"grad_norm": 0.9595913540187618,
"learning_rate": 8.287410500511739e-07,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24893982708454132,
"step": 3725,
"valid_targets_mean": 1926.8,
"valid_targets_min": 497
},
{
"epoch": 6.431034482758621,
"grad_norm": 0.6243254247221967,
"learning_rate": 8.044251245691393e-07,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19777286052703857,
"step": 3730,
"valid_targets_mean": 4638.8,
"valid_targets_min": 695
},
{
"epoch": 6.439655172413793,
"grad_norm": 1.0201483178932162,
"learning_rate": 7.804639333372077e-07,
"loss": 0.2285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19841013848781586,
"step": 3735,
"valid_targets_mean": 1597.1,
"valid_targets_min": 535
},
{
"epoch": 6.448275862068965,
"grad_norm": 0.6715125124145136,
"learning_rate": 7.568579191582248e-07,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15024380385875702,
"step": 3740,
"valid_targets_mean": 3333.9,
"valid_targets_min": 722
},
{
"epoch": 6.456896551724138,
"grad_norm": 0.9225692501156839,
"learning_rate": 7.336075182713708e-07,
"loss": 0.229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18564382195472717,
"step": 3745,
"valid_targets_mean": 1924.0,
"valid_targets_min": 567
},
{
"epoch": 6.4655172413793105,
"grad_norm": 0.8431848482827717,
"learning_rate": 7.107131603440809e-07,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24477818608283997,
"step": 3750,
"valid_targets_mean": 2608.8,
"valid_targets_min": 864
},
{
"epoch": 6.474137931034483,
"grad_norm": 0.8890579364206326,
"learning_rate": 6.881752684641219e-07,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23633387684822083,
"step": 3755,
"valid_targets_mean": 2135.5,
"valid_targets_min": 501
},
{
"epoch": 6.482758620689655,
"grad_norm": 0.9418285611708161,
"learning_rate": 6.659942591317703e-07,
"loss": 0.1965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21280354261398315,
"step": 3760,
"valid_targets_mean": 2341.2,
"valid_targets_min": 730
},
{
"epoch": 6.491379310344827,
"grad_norm": 0.8030498311605387,
"learning_rate": 6.441705422521072e-07,
"loss": 0.2343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3081728518009186,
"step": 3765,
"valid_targets_mean": 2511.6,
"valid_targets_min": 390
},
{
"epoch": 6.5,
"grad_norm": 0.5943846941535217,
"learning_rate": 6.22704521127444e-07,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15976674854755402,
"step": 3770,
"valid_targets_mean": 3873.2,
"valid_targets_min": 561
},
{
"epoch": 6.508620689655173,
"grad_norm": 1.0891839401674237,
"learning_rate": 6.015965924498912e-07,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21925121545791626,
"step": 3775,
"valid_targets_mean": 1394.6,
"valid_targets_min": 463
},
{
"epoch": 6.517241379310345,
"grad_norm": 0.8599544341446648,
"learning_rate": 5.808471462939946e-07,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16710597276687622,
"step": 3780,
"valid_targets_mean": 2198.5,
"valid_targets_min": 554
},
{
"epoch": 6.525862068965517,
"grad_norm": 0.7814752595407828,
"learning_rate": 5.604565661095484e-07,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16703981161117554,
"step": 3785,
"valid_targets_mean": 2364.4,
"valid_targets_min": 667
},
{
"epoch": 6.5344827586206895,
"grad_norm": 0.8041080575361683,
"learning_rate": 5.404252287145006e-07,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21759355068206787,
"step": 3790,
"valid_targets_mean": 2688.5,
"valid_targets_min": 758
},
{
"epoch": 6.543103448275862,
"grad_norm": 0.8965876942311776,
"learning_rate": 5.207535042879963e-07,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28278952836990356,
"step": 3795,
"valid_targets_mean": 2443.2,
"valid_targets_min": 1188
},
{
"epoch": 6.551724137931035,
"grad_norm": 0.9071674222059003,
"learning_rate": 5.014417563635276e-07,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25929227471351624,
"step": 3800,
"valid_targets_mean": 2408.9,
"valid_targets_min": 607
},
{
"epoch": 6.560344827586206,
"grad_norm": 0.8831685374142777,
"learning_rate": 4.824903418222259e-07,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19960355758666992,
"step": 3805,
"valid_targets_mean": 2117.8,
"valid_targets_min": 662
},
{
"epoch": 6.568965517241379,
"grad_norm": 0.8961223958340995,
"learning_rate": 4.638996108862559e-07,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22452160716056824,
"step": 3810,
"valid_targets_mean": 2288.6,
"valid_targets_min": 698
},
{
"epoch": 6.577586206896552,
"grad_norm": 1.0638472212212051,
"learning_rate": 4.456699071123538e-07,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24735592305660248,
"step": 3815,
"valid_targets_mean": 1975.4,
"valid_targets_min": 442
},
{
"epoch": 6.586206896551724,
"grad_norm": 0.8474618730147804,
"learning_rate": 4.2780156738546407e-07,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27747148275375366,
"step": 3820,
"valid_targets_mean": 2450.4,
"valid_targets_min": 433
},
{
"epoch": 6.594827586206897,
"grad_norm": 0.8280145715710722,
"learning_rate": 4.1029492191253296e-07,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3170340657234192,
"step": 3825,
"valid_targets_mean": 3543.2,
"valid_targets_min": 522
},
{
"epoch": 6.603448275862069,
"grad_norm": 0.8420428298122106,
"learning_rate": 3.931502942163956e-07,
"loss": 0.2305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18059438467025757,
"step": 3830,
"valid_targets_mean": 2666.2,
"valid_targets_min": 405
},
{
"epoch": 6.612068965517241,
"grad_norm": 0.7350163043675808,
"learning_rate": 3.763680011297921e-07,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26293593645095825,
"step": 3835,
"valid_targets_mean": 2851.2,
"valid_targets_min": 642
},
{
"epoch": 6.620689655172414,
"grad_norm": 0.6594635552982795,
"learning_rate": 3.599483527895231e-07,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16505607962608337,
"step": 3840,
"valid_targets_mean": 3067.9,
"valid_targets_min": 753
},
{
"epoch": 6.629310344827586,
"grad_norm": 0.9184961795467407,
"learning_rate": 3.4389165263071233e-07,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21113553643226624,
"step": 3845,
"valid_targets_mean": 2008.4,
"valid_targets_min": 388
},
{
"epoch": 6.637931034482759,
"grad_norm": 0.7364720588352186,
"learning_rate": 3.2819819738119983e-07,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.306973397731781,
"step": 3850,
"valid_targets_mean": 3472.8,
"valid_targets_min": 591
},
{
"epoch": 6.646551724137931,
"grad_norm": 0.93393457736903,
"learning_rate": 3.1286827705605984e-07,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20894655585289001,
"step": 3855,
"valid_targets_mean": 1776.7,
"valid_targets_min": 877
},
{
"epoch": 6.655172413793103,
"grad_norm": 0.8524518408875474,
"learning_rate": 2.979021749522448e-07,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16892358660697937,
"step": 3860,
"valid_targets_mean": 2273.3,
"valid_targets_min": 595
},
{
"epoch": 6.663793103448276,
"grad_norm": 0.7130380541280331,
"learning_rate": 2.833001676433367e-07,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.213408425450325,
"step": 3865,
"valid_targets_mean": 3203.2,
"valid_targets_min": 521
},
{
"epoch": 6.672413793103448,
"grad_norm": 0.7018261489432114,
"learning_rate": 2.690625249744572e-07,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31899774074554443,
"step": 3870,
"valid_targets_mean": 3903.7,
"valid_targets_min": 679
},
{
"epoch": 6.681034482758621,
"grad_norm": 0.6418700087130179,
"learning_rate": 2.551895100572566e-07,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16666455566883087,
"step": 3875,
"valid_targets_mean": 3481.6,
"valid_targets_min": 1271
},
{
"epoch": 6.689655172413794,
"grad_norm": 0.8733028268705049,
"learning_rate": 2.4168137926506854e-07,
"loss": 0.2288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2073197364807129,
"step": 3880,
"valid_targets_mean": 2392.1,
"valid_targets_min": 633
},
{
"epoch": 6.698275862068965,
"grad_norm": 0.7901410728478923,
"learning_rate": 2.2853838222817616e-07,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1996878683567047,
"step": 3885,
"valid_targets_mean": 2705.2,
"valid_targets_min": 586
},
{
"epoch": 6.706896551724138,
"grad_norm": 0.8946238203625446,
"learning_rate": 2.1576076182917794e-07,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23879259824752808,
"step": 3890,
"valid_targets_mean": 2460.6,
"valid_targets_min": 687
},
{
"epoch": 6.7155172413793105,
"grad_norm": 0.7680521503043941,
"learning_rate": 2.0334875419851573e-07,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21219167113304138,
"step": 3895,
"valid_targets_mean": 3066.4,
"valid_targets_min": 590
},
{
"epoch": 6.724137931034483,
"grad_norm": 0.936457613376202,
"learning_rate": 1.9130258871011165e-07,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3052334785461426,
"step": 3900,
"valid_targets_mean": 2051.9,
"valid_targets_min": 763
},
{
"epoch": 6.732758620689655,
"grad_norm": 1.0475766339583639,
"learning_rate": 1.7962248797711356e-07,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21644529700279236,
"step": 3905,
"valid_targets_mean": 1918.8,
"valid_targets_min": 726
},
{
"epoch": 6.741379310344827,
"grad_norm": 0.8637115483109303,
"learning_rate": 1.683086678478074e-07,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22499002516269684,
"step": 3910,
"valid_targets_mean": 2219.4,
"valid_targets_min": 523
},
{
"epoch": 6.75,
"grad_norm": 1.0651120829370146,
"learning_rate": 1.573613374015981e-07,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26293978095054626,
"step": 3915,
"valid_targets_mean": 1706.4,
"valid_targets_min": 615
},
{
"epoch": 6.758620689655173,
"grad_norm": 0.761333315392171,
"learning_rate": 1.4678069894517033e-07,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542230784893036,
"step": 3920,
"valid_targets_mean": 3023.2,
"valid_targets_min": 713
},
{
"epoch": 6.767241379310345,
"grad_norm": 0.8423961598753894,
"learning_rate": 1.3656694800873614e-07,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2205635905265808,
"step": 3925,
"valid_targets_mean": 2509.8,
"valid_targets_min": 853
},
{
"epoch": 6.775862068965517,
"grad_norm": 0.916211614133893,
"learning_rate": 1.2672027334242887e-07,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20351552963256836,
"step": 3930,
"valid_targets_mean": 2471.0,
"valid_targets_min": 846
},
{
"epoch": 6.7844827586206895,
"grad_norm": 0.7579473459759021,
"learning_rate": 1.1724085691280806e-07,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18758231401443481,
"step": 3935,
"valid_targets_mean": 2898.5,
"valid_targets_min": 903
},
{
"epoch": 6.793103448275862,
"grad_norm": 0.8231434675312551,
"learning_rate": 1.0812887389950233e-07,
"loss": 0.2473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19742494821548462,
"step": 3940,
"valid_targets_mean": 2438.4,
"valid_targets_min": 640
},
{
"epoch": 6.801724137931035,
"grad_norm": 0.9628228148144512,
"learning_rate": 9.938449269197181e-08,
"loss": 0.2282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23039749264717102,
"step": 3945,
"valid_targets_mean": 1953.7,
"valid_targets_min": 761
},
{
"epoch": 6.810344827586206,
"grad_norm": 0.7894870509582401,
"learning_rate": 9.100787488639295e-08,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2916305363178253,
"step": 3950,
"valid_targets_mean": 3440.9,
"valid_targets_min": 1027
},
{
"epoch": 6.818965517241379,
"grad_norm": 0.7395599333644957,
"learning_rate": 8.299917528267198e-08,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22837454080581665,
"step": 3955,
"valid_targets_mean": 3526.9,
"valid_targets_min": 715
},
{
"epoch": 6.827586206896552,
"grad_norm": 0.8811432377167411,
"learning_rate": 7.535854188159164e-08,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23188039660453796,
"step": 3960,
"valid_targets_mean": 2747.4,
"valid_targets_min": 989
},
{
"epoch": 6.836206896551724,
"grad_norm": 0.8304476063590915,
"learning_rate": 6.808611588206448e-08,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31357303261756897,
"step": 3965,
"valid_targets_mean": 2781.1,
"valid_targets_min": 795
},
{
"epoch": 6.844827586206897,
"grad_norm": 0.8993994292302855,
"learning_rate": 6.11820316785372e-08,
"loss": 0.2337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24727486073970795,
"step": 3970,
"valid_targets_mean": 2601.2,
"valid_targets_min": 527
},
{
"epoch": 6.853448275862069,
"grad_norm": 0.9830591762448566,
"learning_rate": 5.464641685849259e-08,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2648414969444275,
"step": 3975,
"valid_targets_mean": 2094.7,
"valid_targets_min": 409
},
{
"epoch": 6.862068965517241,
"grad_norm": 1.0086942806515675,
"learning_rate": 4.8479392200100336e-08,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2471552938222885,
"step": 3980,
"valid_targets_mean": 2030.5,
"valid_targets_min": 781
},
{
"epoch": 6.870689655172414,
"grad_norm": 0.8571957254541847,
"learning_rate": 4.268107166998769e-08,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24853479862213135,
"step": 3985,
"valid_targets_mean": 2415.8,
"valid_targets_min": 814
},
{
"epoch": 6.879310344827586,
"grad_norm": 0.8789858848023084,
"learning_rate": 3.7251562421123375e-08,
"loss": 0.2197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19849488139152527,
"step": 3990,
"valid_targets_mean": 2971.6,
"valid_targets_min": 393
},
{
"epoch": 6.887931034482759,
"grad_norm": 0.8963419366048488,
"learning_rate": 3.219096479084804e-08,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2406509816646576,
"step": 3995,
"valid_targets_mean": 2845.4,
"valid_targets_min": 780
},
{
"epoch": 6.896551724137931,
"grad_norm": 0.7922366801463806,
"learning_rate": 2.749937229901134e-08,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23498943448066711,
"step": 4000,
"valid_targets_mean": 2786.1,
"valid_targets_min": 1013
},
{
"epoch": 6.905172413793103,
"grad_norm": 0.9071213805483908,
"learning_rate": 2.317687164624882e-08,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22399500012397766,
"step": 4005,
"valid_targets_mean": 2348.9,
"valid_targets_min": 1112
},
{
"epoch": 6.913793103448276,
"grad_norm": 0.9367507061638377,
"learning_rate": 1.9223542712381026e-08,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24696654081344604,
"step": 4010,
"valid_targets_mean": 2180.5,
"valid_targets_min": 377
},
{
"epoch": 6.922413793103448,
"grad_norm": 0.9941698674033683,
"learning_rate": 1.563945855492799e-08,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26774609088897705,
"step": 4015,
"valid_targets_mean": 2133.8,
"valid_targets_min": 589
},
{
"epoch": 6.931034482758621,
"grad_norm": 0.8500184025790589,
"learning_rate": 1.242468540777253e-08,
"loss": 0.2139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2405872642993927,
"step": 4020,
"valid_targets_mean": 2453.4,
"valid_targets_min": 1091
},
{
"epoch": 6.939655172413794,
"grad_norm": 0.6095697059261187,
"learning_rate": 9.579282679927915e-09,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40256640315055847,
"step": 4025,
"valid_targets_mean": 4629.2,
"valid_targets_min": 735
},
{
"epoch": 6.948275862068965,
"grad_norm": 0.7009948391059693,
"learning_rate": 7.1033029544365085e-09,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1720399707555771,
"step": 4030,
"valid_targets_mean": 3406.2,
"valid_targets_min": 630
},
{
"epoch": 6.956896551724138,
"grad_norm": 0.7661105136161285,
"learning_rate": 4.996791987410543e-09,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1798725575208664,
"step": 4035,
"valid_targets_mean": 2961.6,
"valid_targets_min": 907
},
{
"epoch": 6.9655172413793105,
"grad_norm": 0.9354847837018981,
"learning_rate": 3.2597887071750266e-09,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20513418316841125,
"step": 4040,
"valid_targets_mean": 2190.2,
"valid_targets_min": 790
},
{
"epoch": 6.974137931034483,
"grad_norm": 0.8519742635190573,
"learning_rate": 1.892325213552759e-09,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20830674469470978,
"step": 4045,
"valid_targets_mean": 2784.9,
"valid_targets_min": 607
},
{
"epoch": 6.982758620689655,
"grad_norm": 0.9443206286590975,
"learning_rate": 8.944267772692527e-10,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20226803421974182,
"step": 4050,
"valid_targets_mean": 2149.4,
"valid_targets_min": 432
},
{
"epoch": 6.991379310344827,
"grad_norm": 0.8811578949870185,
"learning_rate": 2.66111839490879e-10,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2233564555644989,
"step": 4055,
"valid_targets_mean": 2065.1,
"valid_targets_min": 652
},
{
"epoch": 7.0,
"grad_norm": 0.9695032609226015,
"learning_rate": 7.392011478479787e-12,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25369924306869507,
"step": 4060,
"valid_targets_mean": 2212.8,
"valid_targets_min": 431
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25369924306869507,
"step": 4060,
"total_flos": 644683152949248.0,
"train_loss": 0.3271850697072269,
"train_runtime": 13949.8914,
"train_samples_per_second": 4.655,
"train_steps_per_second": 0.291,
"valid_targets_mean": 2212.8,
"valid_targets_min": 431
}
],
"logging_steps": 5,
"max_steps": 4060,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 644683152949248.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}