Files
exp-uns-r2egym-2_1x_glm_4_7…/trainer_state.json
ModelHub XC 0a1d367b76 初始化项目,由ModelHub XC社区提供模型
Model: laion/exp-uns-r2egym-2_1x_glm_4_7_traces_jupiter_cleaned
Source: Original Platform
2026-06-02 00:31:36 +08:00

10762 lines
298 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4872,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.007189072609633357,
"grad_norm": 20.573642478850733,
"learning_rate": 3.278688524590164e-07,
"loss": 0.8805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3877447843551636,
"step": 5,
"valid_targets_mean": 3123.6,
"valid_targets_min": 486
},
{
"epoch": 0.014378145219266714,
"grad_norm": 23.534982518621135,
"learning_rate": 7.377049180327869e-07,
"loss": 0.8809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46912896633148193,
"step": 10,
"valid_targets_mean": 3414.8,
"valid_targets_min": 528
},
{
"epoch": 0.021567217828900073,
"grad_norm": 24.164733243587904,
"learning_rate": 1.1475409836065575e-06,
"loss": 0.87,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39718469977378845,
"step": 15,
"valid_targets_mean": 4687.1,
"valid_targets_min": 572
},
{
"epoch": 0.02875629043853343,
"grad_norm": 15.447184493591537,
"learning_rate": 1.557377049180328e-06,
"loss": 0.8027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35776641964912415,
"step": 20,
"valid_targets_mean": 3202.1,
"valid_targets_min": 616
},
{
"epoch": 0.035945363048166784,
"grad_norm": 9.664768453884538,
"learning_rate": 1.9672131147540985e-06,
"loss": 0.7594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41083261370658875,
"step": 25,
"valid_targets_mean": 3431.6,
"valid_targets_min": 640
},
{
"epoch": 0.043134435657800146,
"grad_norm": 5.254693135892583,
"learning_rate": 2.377049180327869e-06,
"loss": 0.6731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23213350772857666,
"step": 30,
"valid_targets_mean": 3386.2,
"valid_targets_min": 711
},
{
"epoch": 0.0503235082674335,
"grad_norm": 3.298015416368021,
"learning_rate": 2.786885245901639e-06,
"loss": 0.6337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3576735854148865,
"step": 35,
"valid_targets_mean": 3571.2,
"valid_targets_min": 867
},
{
"epoch": 0.05751258087706686,
"grad_norm": 2.2393410140351944,
"learning_rate": 3.1967213114754105e-06,
"loss": 0.6398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3916738033294678,
"step": 40,
"valid_targets_mean": 3223.5,
"valid_targets_min": 604
},
{
"epoch": 0.06470165348670022,
"grad_norm": 1.5520759530652233,
"learning_rate": 3.6065573770491806e-06,
"loss": 0.5755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.267872154712677,
"step": 45,
"valid_targets_mean": 3251.4,
"valid_targets_min": 735
},
{
"epoch": 0.07189072609633357,
"grad_norm": 1.5311865640065894,
"learning_rate": 4.016393442622951e-06,
"loss": 0.5943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32756370306015015,
"step": 50,
"valid_targets_mean": 4207.4,
"valid_targets_min": 566
},
{
"epoch": 0.07907979870596693,
"grad_norm": 1.0685857284108062,
"learning_rate": 4.426229508196722e-06,
"loss": 0.562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24649468064308167,
"step": 55,
"valid_targets_mean": 3997.9,
"valid_targets_min": 557
},
{
"epoch": 0.08626887131560029,
"grad_norm": 0.9461006126567058,
"learning_rate": 4.836065573770492e-06,
"loss": 0.5413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2554165720939636,
"step": 60,
"valid_targets_mean": 4351.4,
"valid_targets_min": 974
},
{
"epoch": 0.09345794392523364,
"grad_norm": 0.8074203824966353,
"learning_rate": 5.245901639344263e-06,
"loss": 0.5373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20570573210716248,
"step": 65,
"valid_targets_mean": 3216.0,
"valid_targets_min": 569
},
{
"epoch": 0.100647016534867,
"grad_norm": 0.864406247661593,
"learning_rate": 5.655737704918033e-06,
"loss": 0.5013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26434096693992615,
"step": 70,
"valid_targets_mean": 3315.5,
"valid_targets_min": 466
},
{
"epoch": 0.10783608914450037,
"grad_norm": 0.8551627943262912,
"learning_rate": 6.065573770491804e-06,
"loss": 0.4944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24443431198596954,
"step": 75,
"valid_targets_mean": 2707.8,
"valid_targets_min": 580
},
{
"epoch": 0.11502516175413371,
"grad_norm": 0.8588233832507804,
"learning_rate": 6.475409836065575e-06,
"loss": 0.4966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24194490909576416,
"step": 80,
"valid_targets_mean": 2786.4,
"valid_targets_min": 653
},
{
"epoch": 0.12221423436376708,
"grad_norm": 0.6257850424268222,
"learning_rate": 6.885245901639345e-06,
"loss": 0.4667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21724802255630493,
"step": 85,
"valid_targets_mean": 4494.2,
"valid_targets_min": 773
},
{
"epoch": 0.12940330697340044,
"grad_norm": 0.8358272469336914,
"learning_rate": 7.295081967213115e-06,
"loss": 0.4568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27527081966400146,
"step": 90,
"valid_targets_mean": 2980.9,
"valid_targets_min": 639
},
{
"epoch": 0.1365923795830338,
"grad_norm": 0.65329510451641,
"learning_rate": 7.704918032786886e-06,
"loss": 0.4659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2408151626586914,
"step": 95,
"valid_targets_mean": 4151.5,
"valid_targets_min": 777
},
{
"epoch": 0.14378145219266714,
"grad_norm": 0.7011088331824381,
"learning_rate": 8.114754098360657e-06,
"loss": 0.4525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20888058841228485,
"step": 100,
"valid_targets_mean": 3260.6,
"valid_targets_min": 509
},
{
"epoch": 0.1509705248023005,
"grad_norm": 0.6314975069994072,
"learning_rate": 8.524590163934427e-06,
"loss": 0.431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18482504785060883,
"step": 105,
"valid_targets_mean": 3340.9,
"valid_targets_min": 286
},
{
"epoch": 0.15815959741193386,
"grad_norm": 0.6827616460242438,
"learning_rate": 8.934426229508197e-06,
"loss": 0.4346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2140287458896637,
"step": 110,
"valid_targets_mean": 3119.0,
"valid_targets_min": 621
},
{
"epoch": 0.16534867002156722,
"grad_norm": 0.6892155095210419,
"learning_rate": 9.344262295081968e-06,
"loss": 0.4294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17718997597694397,
"step": 115,
"valid_targets_mean": 2981.2,
"valid_targets_min": 359
},
{
"epoch": 0.17253774263120059,
"grad_norm": 0.6184317431223036,
"learning_rate": 9.754098360655738e-06,
"loss": 0.4188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19387683272361755,
"step": 120,
"valid_targets_mean": 3474.8,
"valid_targets_min": 368
},
{
"epoch": 0.17972681524083392,
"grad_norm": 0.713134279760954,
"learning_rate": 1.0163934426229509e-05,
"loss": 0.4329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26430848240852356,
"step": 125,
"valid_targets_mean": 3852.6,
"valid_targets_min": 597
},
{
"epoch": 0.18691588785046728,
"grad_norm": 0.6130847433392762,
"learning_rate": 1.0573770491803279e-05,
"loss": 0.4123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.211105078458786,
"step": 130,
"valid_targets_mean": 4527.5,
"valid_targets_min": 985
},
{
"epoch": 0.19410496046010065,
"grad_norm": 0.6406368473479827,
"learning_rate": 1.0983606557377052e-05,
"loss": 0.4021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1940620243549347,
"step": 135,
"valid_targets_mean": 3756.5,
"valid_targets_min": 779
},
{
"epoch": 0.201294033069734,
"grad_norm": 0.6589114143141694,
"learning_rate": 1.1393442622950821e-05,
"loss": 0.3855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18273743987083435,
"step": 140,
"valid_targets_mean": 4232.9,
"valid_targets_min": 3231
},
{
"epoch": 0.20848310567936737,
"grad_norm": 0.7140798654127781,
"learning_rate": 1.1803278688524591e-05,
"loss": 0.399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22288499772548676,
"step": 145,
"valid_targets_mean": 4247.5,
"valid_targets_min": 805
},
{
"epoch": 0.21567217828900073,
"grad_norm": 0.6264015086815747,
"learning_rate": 1.221311475409836e-05,
"loss": 0.4161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2211969941854477,
"step": 150,
"valid_targets_mean": 4673.0,
"valid_targets_min": 1091
},
{
"epoch": 0.22286125089863407,
"grad_norm": 0.6162894585137502,
"learning_rate": 1.2622950819672132e-05,
"loss": 0.3902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20758062601089478,
"step": 155,
"valid_targets_mean": 4587.4,
"valid_targets_min": 4059
},
{
"epoch": 0.23005032350826743,
"grad_norm": 0.7212307073246284,
"learning_rate": 1.3032786885245904e-05,
"loss": 0.3889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1758236587047577,
"step": 160,
"valid_targets_mean": 3042.4,
"valid_targets_min": 761
},
{
"epoch": 0.2372393961179008,
"grad_norm": 0.680625458237956,
"learning_rate": 1.3442622950819673e-05,
"loss": 0.3782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18720507621765137,
"step": 165,
"valid_targets_mean": 3616.2,
"valid_targets_min": 509
},
{
"epoch": 0.24442846872753415,
"grad_norm": 0.7144132390270651,
"learning_rate": 1.3852459016393445e-05,
"loss": 0.3709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16533072292804718,
"step": 170,
"valid_targets_mean": 2691.1,
"valid_targets_min": 489
},
{
"epoch": 0.2516175413371675,
"grad_norm": 0.7023635269438706,
"learning_rate": 1.4262295081967214e-05,
"loss": 0.3832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2062736600637436,
"step": 175,
"valid_targets_mean": 4041.8,
"valid_targets_min": 523
},
{
"epoch": 0.2588066139468009,
"grad_norm": 0.6519958114973764,
"learning_rate": 1.4672131147540984e-05,
"loss": 0.3795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1904088258743286,
"step": 180,
"valid_targets_mean": 4690.5,
"valid_targets_min": 642
},
{
"epoch": 0.26599568655643424,
"grad_norm": 0.803127069107535,
"learning_rate": 1.5081967213114754e-05,
"loss": 0.3747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19250091910362244,
"step": 185,
"valid_targets_mean": 3694.6,
"valid_targets_min": 622
},
{
"epoch": 0.2731847591660676,
"grad_norm": 0.6524842255260931,
"learning_rate": 1.5491803278688525e-05,
"loss": 0.3738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14555513858795166,
"step": 190,
"valid_targets_mean": 3740.8,
"valid_targets_min": 556
},
{
"epoch": 0.2803738317757009,
"grad_norm": 0.7353147851076066,
"learning_rate": 1.5901639344262295e-05,
"loss": 0.3709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18715769052505493,
"step": 195,
"valid_targets_mean": 3398.0,
"valid_targets_min": 545
},
{
"epoch": 0.2875629043853343,
"grad_norm": 0.699110190722482,
"learning_rate": 1.6311475409836068e-05,
"loss": 0.3718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19545572996139526,
"step": 200,
"valid_targets_mean": 3607.5,
"valid_targets_min": 568
},
{
"epoch": 0.29475197699496763,
"grad_norm": 1.1808205066742428,
"learning_rate": 1.6721311475409837e-05,
"loss": 0.3679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16610263288021088,
"step": 205,
"valid_targets_mean": 3263.6,
"valid_targets_min": 636
},
{
"epoch": 0.301941049604601,
"grad_norm": 0.6397168520175814,
"learning_rate": 1.7131147540983607e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19341236352920532,
"step": 210,
"valid_targets_mean": 3819.5,
"valid_targets_min": 852
},
{
"epoch": 0.30913012221423436,
"grad_norm": 0.6379639056463705,
"learning_rate": 1.7540983606557377e-05,
"loss": 0.3826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17195996642112732,
"step": 215,
"valid_targets_mean": 3233.1,
"valid_targets_min": 500
},
{
"epoch": 0.3163191948238677,
"grad_norm": 0.5942179551543917,
"learning_rate": 1.795081967213115e-05,
"loss": 0.3577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16106751561164856,
"step": 220,
"valid_targets_mean": 4271.6,
"valid_targets_min": 601
},
{
"epoch": 0.3235082674335011,
"grad_norm": 0.826034647461399,
"learning_rate": 1.836065573770492e-05,
"loss": 0.3718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17342892289161682,
"step": 225,
"valid_targets_mean": 3681.0,
"valid_targets_min": 813
},
{
"epoch": 0.33069734004313445,
"grad_norm": 0.8058653706281842,
"learning_rate": 1.877049180327869e-05,
"loss": 0.3666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1488562822341919,
"step": 230,
"valid_targets_mean": 3804.8,
"valid_targets_min": 648
},
{
"epoch": 0.3378864126527678,
"grad_norm": 0.6344857788769837,
"learning_rate": 1.918032786885246e-05,
"loss": 0.3629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1404256522655487,
"step": 235,
"valid_targets_mean": 3125.4,
"valid_targets_min": 617
},
{
"epoch": 0.34507548526240117,
"grad_norm": 0.6434328742127456,
"learning_rate": 1.9590163934426232e-05,
"loss": 0.3646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13383261859416962,
"step": 240,
"valid_targets_mean": 2855.4,
"valid_targets_min": 630
},
{
"epoch": 0.35226455787203453,
"grad_norm": 0.7064545774971568,
"learning_rate": 2e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14416509866714478,
"step": 245,
"valid_targets_mean": 2471.6,
"valid_targets_min": 556
},
{
"epoch": 0.35945363048166784,
"grad_norm": 0.6931492333324353,
"learning_rate": 2.040983606557377e-05,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1825331151485443,
"step": 250,
"valid_targets_mean": 4504.8,
"valid_targets_min": 3506
},
{
"epoch": 0.3666427030913012,
"grad_norm": 0.657195768961274,
"learning_rate": 2.081967213114754e-05,
"loss": 0.3502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2167544960975647,
"step": 255,
"valid_targets_mean": 4500.5,
"valid_targets_min": 894
},
{
"epoch": 0.37383177570093457,
"grad_norm": 0.6384973135842494,
"learning_rate": 2.122950819672131e-05,
"loss": 0.3417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17248007655143738,
"step": 260,
"valid_targets_mean": 4212.5,
"valid_targets_min": 829
},
{
"epoch": 0.38102084831056793,
"grad_norm": 0.7144789700157379,
"learning_rate": 2.1639344262295087e-05,
"loss": 0.3607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16193635761737823,
"step": 265,
"valid_targets_mean": 2716.9,
"valid_targets_min": 593
},
{
"epoch": 0.3882099209202013,
"grad_norm": 0.598654567786524,
"learning_rate": 2.2049180327868857e-05,
"loss": 0.3483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1530938744544983,
"step": 270,
"valid_targets_mean": 4164.4,
"valid_targets_min": 865
},
{
"epoch": 0.39539899352983465,
"grad_norm": 0.6904258025944402,
"learning_rate": 2.2459016393442626e-05,
"loss": 0.3401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17960868775844574,
"step": 275,
"valid_targets_mean": 4070.1,
"valid_targets_min": 740
},
{
"epoch": 0.402588066139468,
"grad_norm": 0.6894409028737439,
"learning_rate": 2.2868852459016396e-05,
"loss": 0.359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1807325780391693,
"step": 280,
"valid_targets_mean": 4034.6,
"valid_targets_min": 845
},
{
"epoch": 0.4097771387491014,
"grad_norm": 0.6802842259041161,
"learning_rate": 2.3278688524590166e-05,
"loss": 0.3517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1755760908126831,
"step": 285,
"valid_targets_mean": 4237.8,
"valid_targets_min": 462
},
{
"epoch": 0.41696621135873474,
"grad_norm": 0.7153194015500277,
"learning_rate": 2.3688524590163936e-05,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14597834646701813,
"step": 290,
"valid_targets_mean": 3897.8,
"valid_targets_min": 762
},
{
"epoch": 0.4241552839683681,
"grad_norm": 0.626280930870836,
"learning_rate": 2.4098360655737705e-05,
"loss": 0.3368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1872946321964264,
"step": 295,
"valid_targets_mean": 4110.1,
"valid_targets_min": 723
},
{
"epoch": 0.43134435657800146,
"grad_norm": 0.6413132226933951,
"learning_rate": 2.4508196721311478e-05,
"loss": 0.3494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21533772349357605,
"step": 300,
"valid_targets_mean": 4881.5,
"valid_targets_min": 3844
},
{
"epoch": 0.43853342918763477,
"grad_norm": 0.6984612265778307,
"learning_rate": 2.4918032786885248e-05,
"loss": 0.3395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20868580043315887,
"step": 305,
"valid_targets_mean": 3898.6,
"valid_targets_min": 769
},
{
"epoch": 0.44572250179726813,
"grad_norm": 0.6522216187873998,
"learning_rate": 2.5327868852459018e-05,
"loss": 0.3455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19474999606609344,
"step": 310,
"valid_targets_mean": 4632.5,
"valid_targets_min": 450
},
{
"epoch": 0.4529115744069015,
"grad_norm": 0.7149143783713475,
"learning_rate": 2.5737704918032787e-05,
"loss": 0.3323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14127987623214722,
"step": 315,
"valid_targets_mean": 3658.1,
"valid_targets_min": 760
},
{
"epoch": 0.46010064701653486,
"grad_norm": 0.7290870789351198,
"learning_rate": 2.6147540983606557e-05,
"loss": 0.363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2236519455909729,
"step": 320,
"valid_targets_mean": 3496.0,
"valid_targets_min": 764
},
{
"epoch": 0.4672897196261682,
"grad_norm": 0.8173532165490279,
"learning_rate": 2.655737704918033e-05,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22370921075344086,
"step": 325,
"valid_targets_mean": 2928.8,
"valid_targets_min": 587
},
{
"epoch": 0.4744787922358016,
"grad_norm": 0.6390755149026872,
"learning_rate": 2.6967213114754103e-05,
"loss": 0.3314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17742975056171417,
"step": 330,
"valid_targets_mean": 4116.4,
"valid_targets_min": 744
},
{
"epoch": 0.48166786484543495,
"grad_norm": 0.7504325873347869,
"learning_rate": 2.7377049180327873e-05,
"loss": 0.3504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19246351718902588,
"step": 335,
"valid_targets_mean": 4115.6,
"valid_targets_min": 504
},
{
"epoch": 0.4888569374550683,
"grad_norm": 0.6918553039170531,
"learning_rate": 2.7786885245901642e-05,
"loss": 0.3402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16972219944000244,
"step": 340,
"valid_targets_mean": 4123.5,
"valid_targets_min": 647
},
{
"epoch": 0.49604601006470167,
"grad_norm": 0.8450381784807004,
"learning_rate": 2.8196721311475412e-05,
"loss": 0.3433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13487985730171204,
"step": 345,
"valid_targets_mean": 2433.0,
"valid_targets_min": 307
},
{
"epoch": 0.503235082674335,
"grad_norm": 0.6459380214431669,
"learning_rate": 2.8606557377049182e-05,
"loss": 0.3689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15826758742332458,
"step": 350,
"valid_targets_mean": 4429.6,
"valid_targets_min": 542
},
{
"epoch": 0.5104241552839683,
"grad_norm": 0.6500752629382867,
"learning_rate": 2.901639344262295e-05,
"loss": 0.3305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1564514935016632,
"step": 355,
"valid_targets_mean": 4117.2,
"valid_targets_min": 520
},
{
"epoch": 0.5176132278936018,
"grad_norm": 0.599014418508955,
"learning_rate": 2.942622950819672e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1816200613975525,
"step": 360,
"valid_targets_mean": 4451.4,
"valid_targets_min": 238
},
{
"epoch": 0.5248023005032351,
"grad_norm": 0.7406430431356334,
"learning_rate": 2.9836065573770498e-05,
"loss": 0.3437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23748645186424255,
"step": 365,
"valid_targets_mean": 4112.0,
"valid_targets_min": 624
},
{
"epoch": 0.5319913731128685,
"grad_norm": 0.7126978990023,
"learning_rate": 3.0245901639344267e-05,
"loss": 0.3289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1286466419696808,
"step": 370,
"valid_targets_mean": 3026.0,
"valid_targets_min": 524
},
{
"epoch": 0.5391804457225018,
"grad_norm": 0.6742826194350676,
"learning_rate": 3.065573770491804e-05,
"loss": 0.3315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14347417652606964,
"step": 375,
"valid_targets_mean": 3989.8,
"valid_targets_min": 767
},
{
"epoch": 0.5463695183321352,
"grad_norm": 0.6286067545561252,
"learning_rate": 3.106557377049181e-05,
"loss": 0.3468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17555642127990723,
"step": 380,
"valid_targets_mean": 4182.5,
"valid_targets_min": 878
},
{
"epoch": 0.5535585909417685,
"grad_norm": 0.6903987730789588,
"learning_rate": 3.1475409836065576e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19024711847305298,
"step": 385,
"valid_targets_mean": 3651.9,
"valid_targets_min": 709
},
{
"epoch": 0.5607476635514018,
"grad_norm": 0.6375843615935716,
"learning_rate": 3.1885245901639346e-05,
"loss": 0.3275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14437010884284973,
"step": 390,
"valid_targets_mean": 3916.0,
"valid_targets_min": 572
},
{
"epoch": 0.5679367361610352,
"grad_norm": 0.7053727765954131,
"learning_rate": 3.2295081967213116e-05,
"loss": 0.3426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1976805031299591,
"step": 395,
"valid_targets_mean": 4752.4,
"valid_targets_min": 652
},
{
"epoch": 0.5751258087706685,
"grad_norm": 0.8072569984620446,
"learning_rate": 3.270491803278689e-05,
"loss": 0.3325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19607961177825928,
"step": 400,
"valid_targets_mean": 3763.6,
"valid_targets_min": 828
},
{
"epoch": 0.582314881380302,
"grad_norm": 0.6106476152608095,
"learning_rate": 3.311475409836066e-05,
"loss": 0.333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13127343356609344,
"step": 405,
"valid_targets_mean": 3272.8,
"valid_targets_min": 377
},
{
"epoch": 0.5895039539899353,
"grad_norm": 0.6482116985826718,
"learning_rate": 3.352459016393443e-05,
"loss": 0.3308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12706303596496582,
"step": 410,
"valid_targets_mean": 3338.0,
"valid_targets_min": 742
},
{
"epoch": 0.5966930265995687,
"grad_norm": 0.6632153860197335,
"learning_rate": 3.39344262295082e-05,
"loss": 0.33,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21092239022254944,
"step": 415,
"valid_targets_mean": 4265.2,
"valid_targets_min": 405
},
{
"epoch": 0.603882099209202,
"grad_norm": 0.7713246956378941,
"learning_rate": 3.434426229508197e-05,
"loss": 0.3262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19024214148521423,
"step": 420,
"valid_targets_mean": 3687.9,
"valid_targets_min": 314
},
{
"epoch": 0.6110711718188354,
"grad_norm": 0.6573267560100432,
"learning_rate": 3.475409836065574e-05,
"loss": 0.3263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21130415797233582,
"step": 425,
"valid_targets_mean": 4377.6,
"valid_targets_min": 879
},
{
"epoch": 0.6182602444284687,
"grad_norm": 0.7418379210193793,
"learning_rate": 3.516393442622951e-05,
"loss": 0.3249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14313599467277527,
"step": 430,
"valid_targets_mean": 2593.2,
"valid_targets_min": 499
},
{
"epoch": 0.6254493170381021,
"grad_norm": 0.7328316064174966,
"learning_rate": 3.557377049180329e-05,
"loss": 0.3475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20951959490776062,
"step": 435,
"valid_targets_mean": 3922.9,
"valid_targets_min": 599
},
{
"epoch": 0.6326383896477354,
"grad_norm": 0.6249361811748065,
"learning_rate": 3.5983606557377056e-05,
"loss": 0.3352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14408886432647705,
"step": 440,
"valid_targets_mean": 3574.6,
"valid_targets_min": 221
},
{
"epoch": 0.6398274622573688,
"grad_norm": 0.570165396935894,
"learning_rate": 3.6393442622950826e-05,
"loss": 0.3395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18353965878486633,
"step": 445,
"valid_targets_mean": 4853.2,
"valid_targets_min": 1054
},
{
"epoch": 0.6470165348670022,
"grad_norm": 0.6538256952663059,
"learning_rate": 3.6803278688524596e-05,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1699550598859787,
"step": 450,
"valid_targets_mean": 4320.8,
"valid_targets_min": 2765
},
{
"epoch": 0.6542056074766355,
"grad_norm": 0.7548701580728006,
"learning_rate": 3.7213114754098365e-05,
"loss": 0.3269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1741151511669159,
"step": 455,
"valid_targets_mean": 3483.0,
"valid_targets_min": 674
},
{
"epoch": 0.6613946800862689,
"grad_norm": 0.6187130203116966,
"learning_rate": 3.7622950819672135e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1886174976825714,
"step": 460,
"valid_targets_mean": 4379.4,
"valid_targets_min": 3644
},
{
"epoch": 0.6685837526959022,
"grad_norm": 0.6026210220029745,
"learning_rate": 3.8032786885245905e-05,
"loss": 0.321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16248294711112976,
"step": 465,
"valid_targets_mean": 3981.2,
"valid_targets_min": 768
},
{
"epoch": 0.6757728253055356,
"grad_norm": 0.5738755197300025,
"learning_rate": 3.8442622950819674e-05,
"loss": 0.3266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1635032296180725,
"step": 470,
"valid_targets_mean": 3884.6,
"valid_targets_min": 634
},
{
"epoch": 0.6829618979151689,
"grad_norm": 0.541333478441975,
"learning_rate": 3.8852459016393444e-05,
"loss": 0.3311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1343890130519867,
"step": 475,
"valid_targets_mean": 3901.5,
"valid_targets_min": 671
},
{
"epoch": 0.6901509705248023,
"grad_norm": 0.6297950944669213,
"learning_rate": 3.9262295081967214e-05,
"loss": 0.3312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1319078505039215,
"step": 480,
"valid_targets_mean": 2984.2,
"valid_targets_min": 421
},
{
"epoch": 0.6973400431344356,
"grad_norm": 0.6442069487231398,
"learning_rate": 3.9672131147540983e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16742603480815887,
"step": 485,
"valid_targets_mean": 3123.9,
"valid_targets_min": 601
},
{
"epoch": 0.7045291157440691,
"grad_norm": 0.5828680764992784,
"learning_rate": 3.999999486478495e-05,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16095879673957825,
"step": 490,
"valid_targets_mean": 3849.0,
"valid_targets_min": 911
},
{
"epoch": 0.7117181883537024,
"grad_norm": 0.727100638844294,
"learning_rate": 3.999981513253493e-05,
"loss": 0.3158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1447129249572754,
"step": 495,
"valid_targets_mean": 2987.5,
"valid_targets_min": 549
},
{
"epoch": 0.7189072609633357,
"grad_norm": 0.66368309677484,
"learning_rate": 3.999937864216924e-05,
"loss": 0.3161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2023858278989792,
"step": 500,
"valid_targets_mean": 4051.2,
"valid_targets_min": 862
},
{
"epoch": 0.7260963335729691,
"grad_norm": 0.6046587260631622,
"learning_rate": 3.999868539929155e-05,
"loss": 0.3126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15529820322990417,
"step": 505,
"valid_targets_mean": 4291.5,
"valid_targets_min": 735
},
{
"epoch": 0.7332854061826024,
"grad_norm": 0.6538819878012135,
"learning_rate": 3.999773541280172e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1858222782611847,
"step": 510,
"valid_targets_mean": 3583.4,
"valid_targets_min": 785
},
{
"epoch": 0.7404744787922358,
"grad_norm": 0.5785423134923583,
"learning_rate": 3.999652869489569e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16107608377933502,
"step": 515,
"valid_targets_mean": 4236.2,
"valid_targets_min": 838
},
{
"epoch": 0.7476635514018691,
"grad_norm": 0.6661760659117584,
"learning_rate": 3.9995065261065356e-05,
"loss": 0.3146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17083489894866943,
"step": 520,
"valid_targets_mean": 3330.0,
"valid_targets_min": 582
},
{
"epoch": 0.7548526240115025,
"grad_norm": 0.5814852024495063,
"learning_rate": 3.9993345130098316e-05,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17902444303035736,
"step": 525,
"valid_targets_mean": 4703.5,
"valid_targets_min": 575
},
{
"epoch": 0.7620416966211359,
"grad_norm": 0.7517015730135961,
"learning_rate": 3.9991368324077635e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15405789017677307,
"step": 530,
"valid_targets_mean": 2682.0,
"valid_targets_min": 737
},
{
"epoch": 0.7692307692307693,
"grad_norm": 0.5665123479287115,
"learning_rate": 3.998913486838161e-05,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16368168592453003,
"step": 535,
"valid_targets_mean": 4069.4,
"valid_targets_min": 736
},
{
"epoch": 0.7764198418404026,
"grad_norm": 0.6136339063989368,
"learning_rate": 3.9986644791683404e-05,
"loss": 0.3164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1443198025226593,
"step": 540,
"valid_targets_mean": 3335.1,
"valid_targets_min": 552
},
{
"epoch": 0.783608914450036,
"grad_norm": 0.5666189504479666,
"learning_rate": 3.998389812595067e-05,
"loss": 0.3161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1655181646347046,
"step": 545,
"valid_targets_mean": 4019.6,
"valid_targets_min": 691
},
{
"epoch": 0.7907979870596693,
"grad_norm": 0.6059954759818537,
"learning_rate": 3.998089490644518e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14678184688091278,
"step": 550,
"valid_targets_mean": 4046.4,
"valid_targets_min": 965
},
{
"epoch": 0.7979870596693026,
"grad_norm": 0.6997466690052564,
"learning_rate": 3.9977635171722334e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18480221927165985,
"step": 555,
"valid_targets_mean": 3190.5,
"valid_targets_min": 521
},
{
"epoch": 0.805176132278936,
"grad_norm": 0.6538968759183521,
"learning_rate": 3.997411896363069e-05,
"loss": 0.3133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14448435604572296,
"step": 560,
"valid_targets_mean": 2742.0,
"valid_targets_min": 577
},
{
"epoch": 0.8123652048885693,
"grad_norm": 0.6256037112502639,
"learning_rate": 3.997034632731141e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16057893633842468,
"step": 565,
"valid_targets_mean": 3521.4,
"valid_targets_min": 767
},
{
"epoch": 0.8195542774982028,
"grad_norm": 0.5840588259185012,
"learning_rate": 3.9966317311197686e-05,
"loss": 0.3129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12496450543403625,
"step": 570,
"valid_targets_mean": 3774.1,
"valid_targets_min": 939
},
{
"epoch": 0.8267433501078361,
"grad_norm": 0.5874137343327693,
"learning_rate": 3.996203196701414e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1374460607767105,
"step": 575,
"valid_targets_mean": 2572.0,
"valid_targets_min": 582
},
{
"epoch": 0.8339324227174695,
"grad_norm": 0.5907503480926745,
"learning_rate": 3.9957490349776114e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14356018602848053,
"step": 580,
"valid_targets_mean": 3366.4,
"valid_targets_min": 675
},
{
"epoch": 0.8411214953271028,
"grad_norm": 0.6733516990659187,
"learning_rate": 3.9952692517789004e-05,
"loss": 0.3111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11857141554355621,
"step": 585,
"valid_targets_mean": 2340.8,
"valid_targets_min": 528
},
{
"epoch": 0.8483105679367362,
"grad_norm": 0.5327001453074538,
"learning_rate": 3.9947638532647495e-05,
"loss": 0.3232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09966681897640228,
"step": 590,
"valid_targets_mean": 2746.8,
"valid_targets_min": 551
},
{
"epoch": 0.8554996405463695,
"grad_norm": 0.5572753499291244,
"learning_rate": 3.994232845923477e-05,
"loss": 0.3128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21287260949611664,
"step": 595,
"valid_targets_mean": 5236.8,
"valid_targets_min": 3550
},
{
"epoch": 0.8626887131560029,
"grad_norm": 0.6260309292514555,
"learning_rate": 3.993676236572169e-05,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1779523491859436,
"step": 600,
"valid_targets_mean": 3889.1,
"valid_targets_min": 638
},
{
"epoch": 0.8698777857656362,
"grad_norm": 0.7575276187630292,
"learning_rate": 3.9930940323565885e-05,
"loss": 0.3329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13865935802459717,
"step": 605,
"valid_targets_mean": 1711.0,
"valid_targets_min": 468
},
{
"epoch": 0.8770668583752695,
"grad_norm": 0.5771116052061334,
"learning_rate": 3.992486240751088e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1751812994480133,
"step": 610,
"valid_targets_mean": 4495.6,
"valid_targets_min": 859
},
{
"epoch": 0.884255930984903,
"grad_norm": 0.569118648358242,
"learning_rate": 3.991852869558512e-05,
"loss": 0.3095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15517261624336243,
"step": 615,
"valid_targets_mean": 3612.4,
"valid_targets_min": 766
},
{
"epoch": 0.8914450035945363,
"grad_norm": 0.5972077897181785,
"learning_rate": 3.9911939269100944e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.150088369846344,
"step": 620,
"valid_targets_mean": 3230.4,
"valid_targets_min": 1066
},
{
"epoch": 0.8986340762041697,
"grad_norm": 0.5925744591529776,
"learning_rate": 3.990509421265357e-05,
"loss": 0.3135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1893511861562729,
"step": 625,
"valid_targets_mean": 4402.9,
"valid_targets_min": 577
},
{
"epoch": 0.905823148813803,
"grad_norm": 0.5548472057370831,
"learning_rate": 3.9897993614120006e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14507707953453064,
"step": 630,
"valid_targets_mean": 3072.5,
"valid_targets_min": 651
},
{
"epoch": 0.9130122214234364,
"grad_norm": 0.7175648198925466,
"learning_rate": 3.9890637564657894e-05,
"loss": 0.3123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17302565276622772,
"step": 635,
"valid_targets_mean": 2339.6,
"valid_targets_min": 586
},
{
"epoch": 0.9202012940330697,
"grad_norm": 0.584831764924473,
"learning_rate": 3.98830261587044e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14775174856185913,
"step": 640,
"valid_targets_mean": 2893.2,
"valid_targets_min": 550
},
{
"epoch": 0.9273903666427031,
"grad_norm": 0.5577687168235862,
"learning_rate": 3.987515949397492e-05,
"loss": 0.3065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15221062302589417,
"step": 645,
"valid_targets_mean": 3455.2,
"valid_targets_min": 656
},
{
"epoch": 0.9345794392523364,
"grad_norm": 0.6171762638763584,
"learning_rate": 3.98670376714619e-05,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1562863290309906,
"step": 650,
"valid_targets_mean": 3444.6,
"valid_targets_min": 382
},
{
"epoch": 0.9417685118619699,
"grad_norm": 0.5304534943571708,
"learning_rate": 3.98586607954335e-05,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1725115031003952,
"step": 655,
"valid_targets_mean": 4867.2,
"valid_targets_min": 3896
},
{
"epoch": 0.9489575844716032,
"grad_norm": 0.6458847453284171,
"learning_rate": 3.9850028973432235e-05,
"loss": 0.3123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1688905954360962,
"step": 660,
"valid_targets_mean": 2693.9,
"valid_targets_min": 607
},
{
"epoch": 0.9561466570812365,
"grad_norm": 0.6039242605720511,
"learning_rate": 3.9841142316273675e-05,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14590154588222504,
"step": 665,
"valid_targets_mean": 2759.8,
"valid_targets_min": 477
},
{
"epoch": 0.9633357296908699,
"grad_norm": 0.5542962369979113,
"learning_rate": 3.983200093804493e-05,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1160636693239212,
"step": 670,
"valid_targets_mean": 3096.2,
"valid_targets_min": 319
},
{
"epoch": 0.9705248023005032,
"grad_norm": 0.5550120004817779,
"learning_rate": 3.982260495610324e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12880077958106995,
"step": 675,
"valid_targets_mean": 3627.6,
"valid_targets_min": 807
},
{
"epoch": 0.9777138749101366,
"grad_norm": 0.6372929298938798,
"learning_rate": 3.981295449107444e-05,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17799600958824158,
"step": 680,
"valid_targets_mean": 3177.5,
"valid_targets_min": 490
},
{
"epoch": 0.9849029475197699,
"grad_norm": 0.6615093926941519,
"learning_rate": 3.980304966685145e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17152747511863708,
"step": 685,
"valid_targets_mean": 2525.2,
"valid_targets_min": 552
},
{
"epoch": 0.9920920201294033,
"grad_norm": 0.5636978041977779,
"learning_rate": 3.9792890610592634e-05,
"loss": 0.3323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13472625613212585,
"step": 690,
"valid_targets_mean": 3632.8,
"valid_targets_min": 643
},
{
"epoch": 0.9992810927390366,
"grad_norm": 0.581225709789264,
"learning_rate": 3.9782477452720216e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12449763715267181,
"step": 695,
"valid_targets_mean": 2487.5,
"valid_targets_min": 669
},
{
"epoch": 1.0057512580877066,
"grad_norm": 0.5553439973715237,
"learning_rate": 3.9771810326918565e-05,
"loss": 0.3132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13287323713302612,
"step": 700,
"valid_targets_mean": 3585.4,
"valid_targets_min": 614
},
{
"epoch": 1.0129403306973401,
"grad_norm": 0.5197160209197271,
"learning_rate": 3.9760889370132504e-05,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12326624989509583,
"step": 705,
"valid_targets_mean": 4040.6,
"valid_targets_min": 761
},
{
"epoch": 1.0201294033069734,
"grad_norm": 0.5196009784810837,
"learning_rate": 3.9749714722565537e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1603870689868927,
"step": 710,
"valid_targets_mean": 4360.2,
"valid_targets_min": 724
},
{
"epoch": 1.0273184759166067,
"grad_norm": 0.6261659804356468,
"learning_rate": 3.9738286527678074e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1782304346561432,
"step": 715,
"valid_targets_mean": 4026.9,
"valid_targets_min": 854
},
{
"epoch": 1.03450754852624,
"grad_norm": 0.49968328840683635,
"learning_rate": 3.972660493218555e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1302112638950348,
"step": 720,
"valid_targets_mean": 4280.0,
"valid_targets_min": 693
},
{
"epoch": 1.0416966211358736,
"grad_norm": 0.5850771062290935,
"learning_rate": 3.9714670086056595e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1399659812450409,
"step": 725,
"valid_targets_mean": 3400.4,
"valid_targets_min": 853
},
{
"epoch": 1.0488856937455069,
"grad_norm": 0.5603228569463079,
"learning_rate": 3.970248214251102e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19615839421749115,
"step": 730,
"valid_targets_mean": 4814.4,
"valid_targets_min": 542
},
{
"epoch": 1.0560747663551402,
"grad_norm": 0.5648677645837813,
"learning_rate": 3.969004125801797e-05,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1610637754201889,
"step": 735,
"valid_targets_mean": 3886.6,
"valid_targets_min": 446
},
{
"epoch": 1.0632638389647735,
"grad_norm": 0.5661342249379625,
"learning_rate": 3.967734759229382e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11380840837955475,
"step": 740,
"valid_targets_mean": 2696.4,
"valid_targets_min": 563
},
{
"epoch": 1.0704529115744068,
"grad_norm": 0.5656284137955258,
"learning_rate": 3.9664401308300154e-05,
"loss": 0.2847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1349925696849823,
"step": 745,
"valid_targets_mean": 3692.1,
"valid_targets_min": 577
},
{
"epoch": 1.0776419841840403,
"grad_norm": 0.5463550825307542,
"learning_rate": 3.9651202572241686e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1740422248840332,
"step": 750,
"valid_targets_mean": 4041.4,
"valid_targets_min": 1094
},
{
"epoch": 1.0848310567936736,
"grad_norm": 0.5384229571092451,
"learning_rate": 3.96377515535641e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1499461531639099,
"step": 755,
"valid_targets_mean": 4691.0,
"valid_targets_min": 678
},
{
"epoch": 1.092020129403307,
"grad_norm": 0.633330557474276,
"learning_rate": 3.962404842495193e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1790314018726349,
"step": 760,
"valid_targets_mean": 4441.2,
"valid_targets_min": 3412
},
{
"epoch": 1.0992092020129403,
"grad_norm": 0.5429522369804931,
"learning_rate": 3.961009336232625e-05,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13355664908885956,
"step": 765,
"valid_targets_mean": 3497.9,
"valid_targets_min": 525
},
{
"epoch": 1.1063982746225738,
"grad_norm": 0.5462783839750516,
"learning_rate": 3.9595886544842505e-05,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13674771785736084,
"step": 770,
"valid_targets_mean": 3951.1,
"valid_targets_min": 824
},
{
"epoch": 1.113587347232207,
"grad_norm": 0.5817114409791175,
"learning_rate": 3.958142815488817e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17169195413589478,
"step": 775,
"valid_targets_mean": 4445.0,
"valid_targets_min": 691
},
{
"epoch": 1.1207764198418404,
"grad_norm": 0.5648447798317549,
"learning_rate": 3.9566718378080404e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19211627542972565,
"step": 780,
"valid_targets_mean": 5507.4,
"valid_targets_min": 4306
},
{
"epoch": 1.1279654924514737,
"grad_norm": 0.49341847979292497,
"learning_rate": 3.955175740326368e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11916790157556534,
"step": 785,
"valid_targets_mean": 3905.2,
"valid_targets_min": 915
},
{
"epoch": 1.1351545650611072,
"grad_norm": 0.5330042034626139,
"learning_rate": 3.953654542250735e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1617271602153778,
"step": 790,
"valid_targets_mean": 4198.2,
"valid_targets_min": 638
},
{
"epoch": 1.1423436376707405,
"grad_norm": 0.5544000058211358,
"learning_rate": 3.952108263110322e-05,
"loss": 0.2873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18863481283187866,
"step": 795,
"valid_targets_mean": 4211.5,
"valid_targets_min": 678
},
{
"epoch": 1.1495327102803738,
"grad_norm": 0.5235489672450487,
"learning_rate": 3.950536922756297e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14819476008415222,
"step": 800,
"valid_targets_mean": 4272.1,
"valid_targets_min": 919
},
{
"epoch": 1.1567217828900072,
"grad_norm": 0.5772533147962314,
"learning_rate": 3.948940541361565e-05,
"loss": 0.3059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17812474071979523,
"step": 805,
"valid_targets_mean": 4165.8,
"valid_targets_min": 498
},
{
"epoch": 1.1639108554996405,
"grad_norm": 0.5665999962700897,
"learning_rate": 3.9473191394205104e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22693896293640137,
"step": 810,
"valid_targets_mean": 4864.1,
"valid_targets_min": 918
},
{
"epoch": 1.171099928109274,
"grad_norm": 0.5703615550122877,
"learning_rate": 3.945672737748731e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13685652613639832,
"step": 815,
"valid_targets_mean": 3327.9,
"valid_targets_min": 632
},
{
"epoch": 1.1782890007189073,
"grad_norm": 0.5198138670541621,
"learning_rate": 3.9440013574827706e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14325293898582458,
"step": 820,
"valid_targets_mean": 4258.8,
"valid_targets_min": 643
},
{
"epoch": 1.1854780733285406,
"grad_norm": 0.5606799589906808,
"learning_rate": 3.942305020079852e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12138460576534271,
"step": 825,
"valid_targets_mean": 3280.8,
"valid_targets_min": 704
},
{
"epoch": 1.192667145938174,
"grad_norm": 0.530676980031532,
"learning_rate": 3.9405837473175944e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1585422158241272,
"step": 830,
"valid_targets_mean": 4695.2,
"valid_targets_min": 649
},
{
"epoch": 1.1998562185478074,
"grad_norm": 0.6260228453322427,
"learning_rate": 3.9388375612937403e-05,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.139860600233078,
"step": 835,
"valid_targets_mean": 3119.8,
"valid_targets_min": 620
},
{
"epoch": 1.2070452911574407,
"grad_norm": 0.5979955679371329,
"learning_rate": 3.9370664844258684e-05,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2046428620815277,
"step": 840,
"valid_targets_mean": 4263.0,
"valid_targets_min": 811
},
{
"epoch": 1.214234363767074,
"grad_norm": 0.5717668797739937,
"learning_rate": 3.935270539451107e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10338851064443588,
"step": 845,
"valid_targets_mean": 2618.5,
"valid_targets_min": 640
},
{
"epoch": 1.2214234363767074,
"grad_norm": 0.6324183749578863,
"learning_rate": 3.933449749425842e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18412905931472778,
"step": 850,
"valid_targets_mean": 3746.4,
"valid_targets_min": 704
},
{
"epoch": 1.2286125089863407,
"grad_norm": 0.5586992298582395,
"learning_rate": 3.931604137725419e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14152535796165466,
"step": 855,
"valid_targets_mean": 3474.4,
"valid_targets_min": 631
},
{
"epoch": 1.2358015815959742,
"grad_norm": 0.5379461460790473,
"learning_rate": 3.9297337280438475e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19222573935985565,
"step": 860,
"valid_targets_mean": 4866.8,
"valid_targets_min": 1089
},
{
"epoch": 1.2429906542056075,
"grad_norm": 0.5721426437343275,
"learning_rate": 3.927838544393492e-05,
"loss": 0.2842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1283596009016037,
"step": 865,
"valid_targets_mean": 2917.4,
"valid_targets_min": 567
},
{
"epoch": 1.2501797268152408,
"grad_norm": 0.5517369618312897,
"learning_rate": 3.925918611104767e-05,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15437334775924683,
"step": 870,
"valid_targets_mean": 2915.2,
"valid_targets_min": 598
},
{
"epoch": 1.2573687994248741,
"grad_norm": 0.48267731416875964,
"learning_rate": 3.923973952825822e-05,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15360784530639648,
"step": 875,
"valid_targets_mean": 4809.2,
"valid_targets_min": 766
},
{
"epoch": 1.2645578720345076,
"grad_norm": 0.6005327005122898,
"learning_rate": 3.922004594522229e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.168386310338974,
"step": 880,
"valid_targets_mean": 3697.8,
"valid_targets_min": 759
},
{
"epoch": 1.271746944644141,
"grad_norm": 0.5900526270016355,
"learning_rate": 3.920010561476657e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1541575938463211,
"step": 885,
"valid_targets_mean": 3725.8,
"valid_targets_min": 739
},
{
"epoch": 1.2789360172537743,
"grad_norm": 0.5424428958428384,
"learning_rate": 3.9179918792885516e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1631605625152588,
"step": 890,
"valid_targets_mean": 5033.8,
"valid_targets_min": 3917
},
{
"epoch": 1.2861250898634076,
"grad_norm": 0.562110119178797,
"learning_rate": 3.915948573873804e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13708816468715668,
"step": 895,
"valid_targets_mean": 2972.0,
"valid_targets_min": 533
},
{
"epoch": 1.2933141624730409,
"grad_norm": 0.5251225453501762,
"learning_rate": 3.913880671464418e-05,
"loss": 0.2803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10703599452972412,
"step": 900,
"valid_targets_mean": 3083.0,
"valid_targets_min": 531
},
{
"epoch": 1.3005032350826744,
"grad_norm": 0.527255808693065,
"learning_rate": 3.911788198608177e-05,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12984885275363922,
"step": 905,
"valid_targets_mean": 3227.2,
"valid_targets_min": 633
},
{
"epoch": 1.3076923076923077,
"grad_norm": 0.5523871978932965,
"learning_rate": 3.909671182168297e-05,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1515636146068573,
"step": 910,
"valid_targets_mean": 3423.0,
"valid_targets_min": 567
},
{
"epoch": 1.314881380301941,
"grad_norm": 0.5458514275613986,
"learning_rate": 3.907529649323088e-05,
"loss": 0.295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18874332308769226,
"step": 915,
"valid_targets_mean": 4317.4,
"valid_targets_min": 1326
},
{
"epoch": 1.3220704529115745,
"grad_norm": 0.5171016490633233,
"learning_rate": 3.905363627565601e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13986511528491974,
"step": 920,
"valid_targets_mean": 4300.5,
"valid_targets_min": 655
},
{
"epoch": 1.3292595255212079,
"grad_norm": 0.5446205102221678,
"learning_rate": 3.903173144703275e-05,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12331528216600418,
"step": 925,
"valid_targets_mean": 3761.5,
"valid_targets_min": 650
},
{
"epoch": 1.3364485981308412,
"grad_norm": 0.5666138697419204,
"learning_rate": 3.900958228857585e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16033025085926056,
"step": 930,
"valid_targets_mean": 4147.9,
"valid_targets_min": 625
},
{
"epoch": 1.3436376707404745,
"grad_norm": 0.6532210361778743,
"learning_rate": 3.898718908463672e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1362089365720749,
"step": 935,
"valid_targets_mean": 2751.1,
"valid_targets_min": 593
},
{
"epoch": 1.3508267433501078,
"grad_norm": 0.5051696538336935,
"learning_rate": 3.896455212269988e-05,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12954682111740112,
"step": 940,
"valid_targets_mean": 3428.1,
"valid_targets_min": 846
},
{
"epoch": 1.358015815959741,
"grad_norm": 0.5736534132040085,
"learning_rate": 3.894167169337919e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1548313945531845,
"step": 945,
"valid_targets_mean": 3938.4,
"valid_targets_min": 675
},
{
"epoch": 1.3652048885693746,
"grad_norm": 0.4938670698885232,
"learning_rate": 3.891854809041417e-05,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12290967255830765,
"step": 950,
"valid_targets_mean": 4109.2,
"valid_targets_min": 800
},
{
"epoch": 1.372393961179008,
"grad_norm": 0.5938911117965663,
"learning_rate": 3.8895181610666196e-05,
"loss": 0.3,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14941787719726562,
"step": 955,
"valid_targets_mean": 3038.4,
"valid_targets_min": 545
},
{
"epoch": 1.3795830337886412,
"grad_norm": 0.521484016781839,
"learning_rate": 3.8871572554114696e-05,
"loss": 0.2873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1749972552061081,
"step": 960,
"valid_targets_mean": 4396.4,
"valid_targets_min": 608
},
{
"epoch": 1.3867721063982748,
"grad_norm": 0.5176443132865125,
"learning_rate": 3.8847721223853334e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1388823539018631,
"step": 965,
"valid_targets_mean": 4115.0,
"valid_targets_min": 753
},
{
"epoch": 1.393961179007908,
"grad_norm": 0.5872567204224207,
"learning_rate": 3.882362792608606e-05,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21744276583194733,
"step": 970,
"valid_targets_mean": 4367.5,
"valid_targets_min": 655
},
{
"epoch": 1.4011502516175414,
"grad_norm": 0.56539435990809,
"learning_rate": 3.879929297012321e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14727197587490082,
"step": 975,
"valid_targets_mean": 3567.1,
"valid_targets_min": 516
},
{
"epoch": 1.4083393242271747,
"grad_norm": 0.5059918570200229,
"learning_rate": 3.877471666837756e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14970964193344116,
"step": 980,
"valid_targets_mean": 4185.9,
"valid_targets_min": 3115
},
{
"epoch": 1.415528396836808,
"grad_norm": 0.5163164050679078,
"learning_rate": 3.874989933636028e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12308366596698761,
"step": 985,
"valid_targets_mean": 3170.4,
"valid_targets_min": 566
},
{
"epoch": 1.4227174694464413,
"grad_norm": 0.5522952793806271,
"learning_rate": 3.872484129267686e-05,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17238599061965942,
"step": 990,
"valid_targets_mean": 3889.1,
"valid_targets_min": 588
},
{
"epoch": 1.4299065420560748,
"grad_norm": 0.5961879603097092,
"learning_rate": 3.869954285902309e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15300405025482178,
"step": 995,
"valid_targets_mean": 3697.9,
"valid_targets_min": 592
},
{
"epoch": 1.4370956146657081,
"grad_norm": 0.47392520471736505,
"learning_rate": 3.8674004360180886e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14228011667728424,
"step": 1000,
"valid_targets_mean": 4135.2,
"valid_targets_min": 516
},
{
"epoch": 1.4442846872753414,
"grad_norm": 0.59329784213223,
"learning_rate": 3.864822612401411e-05,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12148600816726685,
"step": 1005,
"valid_targets_mean": 2810.2,
"valid_targets_min": 415
},
{
"epoch": 1.451473759884975,
"grad_norm": 0.5156223018651376,
"learning_rate": 3.86222084814644e-05,
"loss": 0.2945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2099960893392563,
"step": 1010,
"valid_targets_mean": 4676.2,
"valid_targets_min": 954
},
{
"epoch": 1.4586628324946083,
"grad_norm": 0.5929213995699328,
"learning_rate": 3.8595951766546874e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18259933590888977,
"step": 1015,
"valid_targets_mean": 3383.6,
"valid_targets_min": 589
},
{
"epoch": 1.4658519051042416,
"grad_norm": 0.44437186370848597,
"learning_rate": 3.856945631634589e-05,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11551199853420258,
"step": 1020,
"valid_targets_mean": 3701.6,
"valid_targets_min": 524
},
{
"epoch": 1.4730409777138749,
"grad_norm": 0.5072064763974775,
"learning_rate": 3.854272247101068e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14987875521183014,
"step": 1025,
"valid_targets_mean": 4569.1,
"valid_targets_min": 612
},
{
"epoch": 1.4802300503235082,
"grad_norm": 0.4655200344372254,
"learning_rate": 3.851575057375101e-05,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1204090267419815,
"step": 1030,
"valid_targets_mean": 3899.2,
"valid_targets_min": 617
},
{
"epoch": 1.4874191229331415,
"grad_norm": 0.5728562126071537,
"learning_rate": 3.8488540970832754e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1308048665523529,
"step": 1035,
"valid_targets_mean": 2915.0,
"valid_targets_min": 477
},
{
"epoch": 1.494608195542775,
"grad_norm": 0.5511649364727081,
"learning_rate": 3.846109401157345e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09357282519340515,
"step": 1040,
"valid_targets_mean": 1808.2,
"valid_targets_min": 486
},
{
"epoch": 1.5017972681524083,
"grad_norm": 0.5296838223120048,
"learning_rate": 3.843341004833784e-05,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15539321303367615,
"step": 1045,
"valid_targets_mean": 4149.1,
"valid_targets_min": 861
},
{
"epoch": 1.5089863407620419,
"grad_norm": 0.5461095453788049,
"learning_rate": 3.840548943653333e-05,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12287761270999908,
"step": 1050,
"valid_targets_mean": 2310.9,
"valid_targets_min": 730
},
{
"epoch": 1.5161754133716752,
"grad_norm": 0.5100354908552306,
"learning_rate": 3.83773325346054e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14473143219947815,
"step": 1055,
"valid_targets_mean": 4014.5,
"valid_targets_min": 887
},
{
"epoch": 1.5233644859813085,
"grad_norm": 0.5226379950787434,
"learning_rate": 3.834893970403306e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13530033826828003,
"step": 1060,
"valid_targets_mean": 2959.1,
"valid_targets_min": 653
},
{
"epoch": 1.5305535585909418,
"grad_norm": 0.5566617697030245,
"learning_rate": 3.832031130932415e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12731043994426727,
"step": 1065,
"valid_targets_mean": 3113.8,
"valid_targets_min": 660
},
{
"epoch": 1.537742631200575,
"grad_norm": 0.4513676317081486,
"learning_rate": 3.8291447718010706e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11857186257839203,
"step": 1070,
"valid_targets_mean": 4130.1,
"valid_targets_min": 581
},
{
"epoch": 1.5449317038102084,
"grad_norm": 0.5703581165114259,
"learning_rate": 3.826234930064422e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13232873380184174,
"step": 1075,
"valid_targets_mean": 3404.8,
"valid_targets_min": 888
},
{
"epoch": 1.5521207764198417,
"grad_norm": 0.5209632185141453,
"learning_rate": 3.82330164307909e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12993882596492767,
"step": 1080,
"valid_targets_mean": 3908.0,
"valid_targets_min": 535
},
{
"epoch": 1.5593098490294752,
"grad_norm": 0.5068701501791201,
"learning_rate": 3.820344948502682e-05,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20242813229560852,
"step": 1085,
"valid_targets_mean": 4670.1,
"valid_targets_min": 1088
},
{
"epoch": 1.5664989216391085,
"grad_norm": 0.5323592122608582,
"learning_rate": 3.8173648842933173e-05,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1509951651096344,
"step": 1090,
"valid_targets_mean": 5006.2,
"valid_targets_min": 3176
},
{
"epoch": 1.573687994248742,
"grad_norm": 0.6152354366056297,
"learning_rate": 3.814361488709132e-05,
"loss": 0.3059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16126582026481628,
"step": 1095,
"valid_targets_mean": 3042.6,
"valid_targets_min": 673
},
{
"epoch": 1.5808770668583754,
"grad_norm": 0.5961551035844662,
"learning_rate": 3.8113348003077926e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12394510954618454,
"step": 1100,
"valid_targets_mean": 3242.1,
"valid_targets_min": 573
},
{
"epoch": 1.5880661394680087,
"grad_norm": 0.47980821001671486,
"learning_rate": 3.808284857945999e-05,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1280575692653656,
"step": 1105,
"valid_targets_mean": 4582.2,
"valid_targets_min": 607
},
{
"epoch": 1.595255212077642,
"grad_norm": 0.507500812907104,
"learning_rate": 3.805211700778984e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13678506016731262,
"step": 1110,
"valid_targets_mean": 3753.8,
"valid_targets_min": 720
},
{
"epoch": 1.6024442846872753,
"grad_norm": 0.49705689698484373,
"learning_rate": 3.802115368260016e-05,
"loss": 0.2846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15146461129188538,
"step": 1115,
"valid_targets_mean": 3863.8,
"valid_targets_min": 770
},
{
"epoch": 1.6096333572969086,
"grad_norm": 0.43272714289145614,
"learning_rate": 3.798995900139889e-05,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11581413447856903,
"step": 1120,
"valid_targets_mean": 4227.2,
"valid_targets_min": 905
},
{
"epoch": 1.616822429906542,
"grad_norm": 0.6434087265414399,
"learning_rate": 3.795853336466408e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1903274953365326,
"step": 1125,
"valid_targets_mean": 3343.6,
"valid_targets_min": 708
},
{
"epoch": 1.6240115025161754,
"grad_norm": 0.5786733657323256,
"learning_rate": 3.7926877175838844e-05,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2227598875761032,
"step": 1130,
"valid_targets_mean": 3601.8,
"valid_targets_min": 706
},
{
"epoch": 1.6312005751258087,
"grad_norm": 0.5216255139577858,
"learning_rate": 3.7894990841326095e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19719943404197693,
"step": 1135,
"valid_targets_mean": 4424.4,
"valid_targets_min": 1563
},
{
"epoch": 1.6383896477354423,
"grad_norm": 0.47385348746292455,
"learning_rate": 3.786287477048338e-05,
"loss": 0.2873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14471015334129333,
"step": 1140,
"valid_targets_mean": 4585.0,
"valid_targets_min": 758
},
{
"epoch": 1.6455787203450756,
"grad_norm": 0.496509144966886,
"learning_rate": 3.783052937561762e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12411241978406906,
"step": 1145,
"valid_targets_mean": 3547.8,
"valid_targets_min": 727
},
{
"epoch": 1.6527677929547089,
"grad_norm": 0.5337477757052604,
"learning_rate": 3.779795507197975e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12069012969732285,
"step": 1150,
"valid_targets_mean": 2619.9,
"valid_targets_min": 630
},
{
"epoch": 1.6599568655643422,
"grad_norm": 0.555030233675228,
"learning_rate": 3.77651522777595e-05,
"loss": 0.2846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1416761577129364,
"step": 1155,
"valid_targets_mean": 2981.6,
"valid_targets_min": 543
},
{
"epoch": 1.6671459381739755,
"grad_norm": 0.5314725659453191,
"learning_rate": 3.773212141407994e-05,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1304677575826645,
"step": 1160,
"valid_targets_mean": 3663.9,
"valid_targets_min": 661
},
{
"epoch": 1.6743350107836088,
"grad_norm": 0.557105621995766,
"learning_rate": 3.769886290499211e-05,
"loss": 0.3171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14408347010612488,
"step": 1165,
"valid_targets_mean": 3259.2,
"valid_targets_min": 670
},
{
"epoch": 1.681524083393242,
"grad_norm": 0.5236188088487769,
"learning_rate": 3.766537717746955e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13859708607196808,
"step": 1170,
"valid_targets_mean": 3392.2,
"valid_targets_min": 491
},
{
"epoch": 1.6887131560028756,
"grad_norm": 0.47979346096235626,
"learning_rate": 3.7631664661402854e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1257590651512146,
"step": 1175,
"valid_targets_mean": 4215.4,
"valid_targets_min": 964
},
{
"epoch": 1.695902228612509,
"grad_norm": 0.5549812009815447,
"learning_rate": 3.759772578959413e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14304929971694946,
"step": 1180,
"valid_targets_mean": 2919.5,
"valid_targets_min": 635
},
{
"epoch": 1.7030913012221425,
"grad_norm": 0.5100981619143163,
"learning_rate": 3.7563560997751453e-05,
"loss": 0.2847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12205301225185394,
"step": 1185,
"valid_targets_mean": 3287.5,
"valid_targets_min": 297
},
{
"epoch": 1.7102803738317758,
"grad_norm": 0.5542814369344694,
"learning_rate": 3.752917072448324e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1393413543701172,
"step": 1190,
"valid_targets_mean": 3343.5,
"valid_targets_min": 532
},
{
"epoch": 1.717469446441409,
"grad_norm": 0.5004127002541743,
"learning_rate": 3.7494555411292665e-05,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14154654741287231,
"step": 1195,
"valid_targets_mean": 3552.9,
"valid_targets_min": 882
},
{
"epoch": 1.7246585190510424,
"grad_norm": 0.5369377603113736,
"learning_rate": 3.7459715502571974e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14404495060443878,
"step": 1200,
"valid_targets_mean": 3497.0,
"valid_targets_min": 732
},
{
"epoch": 1.7318475916606757,
"grad_norm": 0.5692617287750511,
"learning_rate": 3.742465144559675e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14669956266880035,
"step": 1205,
"valid_targets_mean": 2881.1,
"valid_targets_min": 617
},
{
"epoch": 1.739036664270309,
"grad_norm": 0.5065041606981532,
"learning_rate": 3.7389363690520236e-05,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10892973095178604,
"step": 1210,
"valid_targets_mean": 3190.4,
"valid_targets_min": 861
},
{
"epoch": 1.7462257368799425,
"grad_norm": 0.5083030454665067,
"learning_rate": 3.735385269036747e-05,
"loss": 0.2842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15521150827407837,
"step": 1215,
"valid_targets_mean": 3963.9,
"valid_targets_min": 663
},
{
"epoch": 1.7534148094895758,
"grad_norm": 0.44482574218300447,
"learning_rate": 3.731811890102956e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1155744269490242,
"step": 1220,
"valid_targets_mean": 3604.9,
"valid_targets_min": 770
},
{
"epoch": 1.7606038820992091,
"grad_norm": 0.539860187359408,
"learning_rate": 3.728216278125776e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15875539183616638,
"step": 1225,
"valid_targets_mean": 3555.1,
"valid_targets_min": 745
},
{
"epoch": 1.7677929547088427,
"grad_norm": 0.4410205993807063,
"learning_rate": 3.724598479265761e-05,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12200931459665298,
"step": 1230,
"valid_targets_mean": 4136.0,
"valid_targets_min": 583
},
{
"epoch": 1.774982027318476,
"grad_norm": 0.49605181628499445,
"learning_rate": 3.720958539968302e-05,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15854984521865845,
"step": 1235,
"valid_targets_mean": 3980.0,
"valid_targets_min": 412
},
{
"epoch": 1.7821710999281093,
"grad_norm": 0.5097674785148915,
"learning_rate": 3.7172965069630285e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12535299360752106,
"step": 1240,
"valid_targets_mean": 3590.9,
"valid_targets_min": 555
},
{
"epoch": 1.7893601725377426,
"grad_norm": 0.530740961884203,
"learning_rate": 3.713612427263209e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17841705679893494,
"step": 1245,
"valid_targets_mean": 4256.5,
"valid_targets_min": 785
},
{
"epoch": 1.796549245147376,
"grad_norm": 0.525125717742193,
"learning_rate": 3.70990634816515e-05,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14326494932174683,
"step": 1250,
"valid_targets_mean": 2654.0,
"valid_targets_min": 567
},
{
"epoch": 1.8037383177570092,
"grad_norm": 0.47882978123124514,
"learning_rate": 3.706178317247585e-05,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1471397876739502,
"step": 1255,
"valid_targets_mean": 4397.4,
"valid_targets_min": 593
},
{
"epoch": 1.8109273903666427,
"grad_norm": 0.5886031941773199,
"learning_rate": 3.702428382371066e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15693509578704834,
"step": 1260,
"valid_targets_mean": 2723.0,
"valid_targets_min": 448
},
{
"epoch": 1.818116462976276,
"grad_norm": 0.5664729440418096,
"learning_rate": 3.698656591677348e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09844028949737549,
"step": 1265,
"valid_targets_mean": 2811.0,
"valid_targets_min": 275
},
{
"epoch": 1.8253055355859096,
"grad_norm": 0.498049887694824,
"learning_rate": 3.694862993588774e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1390022337436676,
"step": 1270,
"valid_targets_mean": 4099.2,
"valid_targets_min": 3258
},
{
"epoch": 1.8324946081955429,
"grad_norm": 0.6036330907468369,
"learning_rate": 3.6910476368076466e-05,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16148319840431213,
"step": 1275,
"valid_targets_mean": 3122.1,
"valid_targets_min": 648
},
{
"epoch": 1.8396836808051762,
"grad_norm": 0.5012127171683514,
"learning_rate": 3.6872105703156116e-05,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11360730975866318,
"step": 1280,
"valid_targets_mean": 3105.0,
"valid_targets_min": 422
},
{
"epoch": 1.8468727534148095,
"grad_norm": 0.5151919144409882,
"learning_rate": 3.683351843373021e-05,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16393089294433594,
"step": 1285,
"valid_targets_mean": 4949.4,
"valid_targets_min": 4000
},
{
"epoch": 1.8540618260244428,
"grad_norm": 0.5266250897243666,
"learning_rate": 3.679471505518306e-05,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13978716731071472,
"step": 1290,
"valid_targets_mean": 3342.1,
"valid_targets_min": 767
},
{
"epoch": 1.8612508986340761,
"grad_norm": 0.49171130776521615,
"learning_rate": 3.67556960656734e-05,
"loss": 0.2796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14079241454601288,
"step": 1295,
"valid_targets_mean": 3342.5,
"valid_targets_min": 726
},
{
"epoch": 1.8684399712437094,
"grad_norm": 0.49843468685276926,
"learning_rate": 3.6716461966127955e-05,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14257866144180298,
"step": 1300,
"valid_targets_mean": 3800.0,
"valid_targets_min": 640
},
{
"epoch": 1.875629043853343,
"grad_norm": 0.5496180609804349,
"learning_rate": 3.6677013260235054e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16164788603782654,
"step": 1305,
"valid_targets_mean": 3051.6,
"valid_targets_min": 671
},
{
"epoch": 1.8828181164629763,
"grad_norm": 0.5170287488041243,
"learning_rate": 3.663735045443816e-05,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16715139150619507,
"step": 1310,
"valid_targets_mean": 3631.0,
"valid_targets_min": 665
},
{
"epoch": 1.8900071890726098,
"grad_norm": 0.5086856038225003,
"learning_rate": 3.659747405792935e-05,
"loss": 0.2745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1597132831811905,
"step": 1315,
"valid_targets_mean": 3384.6,
"valid_targets_min": 720
},
{
"epoch": 1.897196261682243,
"grad_norm": 0.5276886812025636,
"learning_rate": 3.655738458264275e-05,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12705910205841064,
"step": 1320,
"valid_targets_mean": 3736.5,
"valid_targets_min": 593
},
{
"epoch": 1.9043853342918764,
"grad_norm": 0.47184848582856675,
"learning_rate": 3.651708254324805e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14923986792564392,
"step": 1325,
"valid_targets_mean": 4219.8,
"valid_targets_min": 505
},
{
"epoch": 1.9115744069015097,
"grad_norm": 0.5095295218556172,
"learning_rate": 3.64765684571438e-05,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1307600885629654,
"step": 1330,
"valid_targets_mean": 3621.0,
"valid_targets_min": 977
},
{
"epoch": 1.918763479511143,
"grad_norm": 0.4994876634935122,
"learning_rate": 3.6435842844450834e-05,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14474749565124512,
"step": 1335,
"valid_targets_mean": 3611.5,
"valid_targets_min": 678
},
{
"epoch": 1.9259525521207763,
"grad_norm": 0.8084296900592843,
"learning_rate": 3.639490622800557e-05,
"loss": 0.2815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15133309364318848,
"step": 1340,
"valid_targets_mean": 3889.6,
"valid_targets_min": 903
},
{
"epoch": 1.9331416247304096,
"grad_norm": 0.47612540531078573,
"learning_rate": 3.635375913335328e-05,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11670131981372833,
"step": 1345,
"valid_targets_mean": 3428.1,
"valid_targets_min": 620
},
{
"epoch": 1.9403306973400432,
"grad_norm": 0.5201381114302891,
"learning_rate": 3.631240208874138e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17568343877792358,
"step": 1350,
"valid_targets_mean": 4018.5,
"valid_targets_min": 771
},
{
"epoch": 1.9475197699496765,
"grad_norm": 0.5684687696419027,
"learning_rate": 3.627083562511262e-05,
"loss": 0.2797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15264779329299927,
"step": 1355,
"valid_targets_mean": 4340.8,
"valid_targets_min": 502
},
{
"epoch": 1.95470884255931,
"grad_norm": 0.505802871570166,
"learning_rate": 3.622906027609826e-05,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14337629079818726,
"step": 1360,
"valid_targets_mean": 3748.8,
"valid_targets_min": 482
},
{
"epoch": 1.9618979151689433,
"grad_norm": 0.5332734023712747,
"learning_rate": 3.618707657801127e-05,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12836483120918274,
"step": 1365,
"valid_targets_mean": 3103.9,
"valid_targets_min": 596
},
{
"epoch": 1.9690869877785766,
"grad_norm": 0.5021612024263556,
"learning_rate": 3.614488506983939e-05,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14348819851875305,
"step": 1370,
"valid_targets_mean": 4130.9,
"valid_targets_min": 851
},
{
"epoch": 1.97627606038821,
"grad_norm": 0.610411285067793,
"learning_rate": 3.6102486293238236e-05,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15583057701587677,
"step": 1375,
"valid_targets_mean": 3433.0,
"valid_targets_min": 538
},
{
"epoch": 1.9834651329978432,
"grad_norm": 0.49020599604774884,
"learning_rate": 3.6059880792524326e-05,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10183790326118469,
"step": 1380,
"valid_targets_mean": 2611.9,
"valid_targets_min": 712
},
{
"epoch": 1.9906542056074765,
"grad_norm": 0.4649398951912101,
"learning_rate": 3.601706911466813e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11849203705787659,
"step": 1385,
"valid_targets_mean": 4027.6,
"valid_targets_min": 918
},
{
"epoch": 1.9978432782171098,
"grad_norm": 0.5652715236268022,
"learning_rate": 3.597405180928701e-05,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16841626167297363,
"step": 1390,
"valid_targets_mean": 4007.5,
"valid_targets_min": 821
},
{
"epoch": 2.00431344356578,
"grad_norm": 0.44042475910319384,
"learning_rate": 3.5930829428638195e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12045784294605255,
"step": 1395,
"valid_targets_mean": 3999.5,
"valid_targets_min": 286
},
{
"epoch": 2.011502516175413,
"grad_norm": 0.46014945634483034,
"learning_rate": 3.588740252761165e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15798038244247437,
"step": 1400,
"valid_targets_mean": 5402.1,
"valid_targets_min": 3999
},
{
"epoch": 2.0186915887850465,
"grad_norm": 0.5864474166210711,
"learning_rate": 3.5843771663722994e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14607274532318115,
"step": 1405,
"valid_targets_mean": 2451.4,
"valid_targets_min": 606
},
{
"epoch": 2.0258806613946803,
"grad_norm": 0.5922859588085109,
"learning_rate": 3.5799937397106336e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.149421826004982,
"step": 1410,
"valid_targets_mean": 3078.4,
"valid_targets_min": 615
},
{
"epoch": 2.0330697340043136,
"grad_norm": 0.576123978661105,
"learning_rate": 3.575590029050705e-05,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1341801881790161,
"step": 1415,
"valid_targets_mean": 2612.0,
"valid_targets_min": 694
},
{
"epoch": 2.040258806613947,
"grad_norm": 0.5001343696732509,
"learning_rate": 3.57116609092746e-05,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16290068626403809,
"step": 1420,
"valid_targets_mean": 4209.9,
"valid_targets_min": 783
},
{
"epoch": 2.04744787922358,
"grad_norm": 0.47175040208647506,
"learning_rate": 3.5667219821355226e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12168647348880768,
"step": 1425,
"valid_targets_mean": 4308.9,
"valid_targets_min": 721
},
{
"epoch": 2.0546369518332135,
"grad_norm": 0.5196704922805649,
"learning_rate": 3.5622577597284724e-05,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13878659904003143,
"step": 1430,
"valid_targets_mean": 4093.0,
"valid_targets_min": 882
},
{
"epoch": 2.061826024442847,
"grad_norm": 0.5477085097658387,
"learning_rate": 3.557773481018104e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11407799273729324,
"step": 1435,
"valid_targets_mean": 2638.8,
"valid_targets_min": 551
},
{
"epoch": 2.06901509705248,
"grad_norm": 0.47586536612060937,
"learning_rate": 3.5532692035736975e-05,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11465832591056824,
"step": 1440,
"valid_targets_mean": 3847.8,
"valid_targets_min": 671
},
{
"epoch": 2.0762041696621134,
"grad_norm": 0.6396794264804806,
"learning_rate": 3.548744985221277e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09672622382640839,
"step": 1445,
"valid_targets_mean": 2118.6,
"valid_targets_min": 706
},
{
"epoch": 2.083393242271747,
"grad_norm": 0.5908485673059465,
"learning_rate": 3.544200884042869e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11773449927568436,
"step": 1450,
"valid_targets_mean": 2278.6,
"valid_targets_min": 606
},
{
"epoch": 2.0905823148813805,
"grad_norm": 0.9011502937614828,
"learning_rate": 3.539636958375755e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1216643825173378,
"step": 1455,
"valid_targets_mean": 2758.0,
"valid_targets_min": 652
},
{
"epoch": 2.0977713874910138,
"grad_norm": 0.5586718911086384,
"learning_rate": 3.535053266811725e-05,
"loss": 0.269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1211056336760521,
"step": 1460,
"valid_targets_mean": 2683.1,
"valid_targets_min": 586
},
{
"epoch": 2.104960460100647,
"grad_norm": 0.49054572735296403,
"learning_rate": 3.5304498681963216e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12743888795375824,
"step": 1465,
"valid_targets_mean": 3772.6,
"valid_targets_min": 916
},
{
"epoch": 2.1121495327102804,
"grad_norm": 0.5650208920966238,
"learning_rate": 3.52582682162809e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14947383105754852,
"step": 1470,
"valid_targets_mean": 2826.8,
"valid_targets_min": 499
},
{
"epoch": 2.1193386053199137,
"grad_norm": 0.45465073195112815,
"learning_rate": 3.521184186457815e-05,
"loss": 0.2667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13897745311260223,
"step": 1475,
"valid_targets_mean": 4228.9,
"valid_targets_min": 575
},
{
"epoch": 2.126527677929547,
"grad_norm": 0.5735246322929461,
"learning_rate": 3.51652202228776e-05,
"loss": 0.2617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17849652469158173,
"step": 1480,
"valid_targets_mean": 4539.4,
"valid_targets_min": 734
},
{
"epoch": 2.1337167505391803,
"grad_norm": 0.6091822343999242,
"learning_rate": 3.511840388970903e-05,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.145311176776886,
"step": 1485,
"valid_targets_mean": 2660.6,
"valid_targets_min": 206
},
{
"epoch": 2.1409058231488136,
"grad_norm": 0.5177727754454414,
"learning_rate": 3.507139346610167e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13099326193332672,
"step": 1490,
"valid_targets_mean": 3336.1,
"valid_targets_min": 500
},
{
"epoch": 2.1480948957584474,
"grad_norm": 0.47860594671573575,
"learning_rate": 3.502418955557649e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10694457590579987,
"step": 1495,
"valid_targets_mean": 3990.4,
"valid_targets_min": 616
},
{
"epoch": 2.1552839683680807,
"grad_norm": 0.5251786287771435,
"learning_rate": 3.4976792764138446e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09503109753131866,
"step": 1500,
"valid_targets_mean": 2990.2,
"valid_targets_min": 670
},
{
"epoch": 2.162473040977714,
"grad_norm": 0.4993754918391816,
"learning_rate": 3.4929203700268706e-05,
"loss": 0.272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11814264208078384,
"step": 1505,
"valid_targets_mean": 3831.6,
"valid_targets_min": 802
},
{
"epoch": 2.1696621135873473,
"grad_norm": 0.5661575463954994,
"learning_rate": 3.488142297491683e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11874938011169434,
"step": 1510,
"valid_targets_mean": 3086.4,
"valid_targets_min": 599
},
{
"epoch": 2.1768511861969806,
"grad_norm": 0.5826772519983847,
"learning_rate": 3.483345120149294e-05,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15646061301231384,
"step": 1515,
"valid_targets_mean": 3559.1,
"valid_targets_min": 242
},
{
"epoch": 2.184040258806614,
"grad_norm": 0.5139252289446473,
"learning_rate": 3.4785288995859835e-05,
"loss": 0.2628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13239224255084991,
"step": 1520,
"valid_targets_mean": 3718.9,
"valid_targets_min": 503
},
{
"epoch": 2.191229331416247,
"grad_norm": 0.4982519981602888,
"learning_rate": 3.4736936976325094e-05,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15333423018455505,
"step": 1525,
"valid_targets_mean": 4679.8,
"valid_targets_min": 693
},
{
"epoch": 2.1984184040258805,
"grad_norm": 0.48520099933200456,
"learning_rate": 3.468839576363313e-05,
"loss": 0.2674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15786109864711761,
"step": 1530,
"valid_targets_mean": 4654.2,
"valid_targets_min": 3386
},
{
"epoch": 2.205607476635514,
"grad_norm": 0.5104245415475017,
"learning_rate": 3.463966598095721e-05,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12429475039243698,
"step": 1535,
"valid_targets_mean": 3454.0,
"valid_targets_min": 694
},
{
"epoch": 2.2127965492451476,
"grad_norm": 0.5657497859202579,
"learning_rate": 3.459074825389147e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.141516774892807,
"step": 1540,
"valid_targets_mean": 3773.1,
"valid_targets_min": 647
},
{
"epoch": 2.219985621854781,
"grad_norm": 0.5163287527650611,
"learning_rate": 3.4541643210442895e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17117419838905334,
"step": 1545,
"valid_targets_mean": 5093.4,
"valid_targets_min": 745
},
{
"epoch": 2.227174694464414,
"grad_norm": 0.5564079368258821,
"learning_rate": 3.4492351481023236e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19022008776664734,
"step": 1550,
"valid_targets_mean": 4066.0,
"valid_targets_min": 635
},
{
"epoch": 2.2343637670740475,
"grad_norm": 0.5397979967201494,
"learning_rate": 3.444287369844092e-05,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09026080369949341,
"step": 1555,
"valid_targets_mean": 1724.5,
"valid_targets_min": 221
},
{
"epoch": 2.241552839683681,
"grad_norm": 0.4815453466365358,
"learning_rate": 3.439321049789292e-05,
"loss": 0.2684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11930803209543228,
"step": 1560,
"valid_targets_mean": 3645.6,
"valid_targets_min": 619
},
{
"epoch": 2.248741912293314,
"grad_norm": 0.5625767162580588,
"learning_rate": 3.434336251695663e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10417810082435608,
"step": 1565,
"valid_targets_mean": 2749.9,
"valid_targets_min": 578
},
{
"epoch": 2.2559309849029474,
"grad_norm": 0.5803374667156413,
"learning_rate": 3.429333039558164e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1408432126045227,
"step": 1570,
"valid_targets_mean": 3556.9,
"valid_targets_min": 769
},
{
"epoch": 2.2631200575125807,
"grad_norm": 0.5223520497569117,
"learning_rate": 3.424311477608155e-05,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14780449867248535,
"step": 1575,
"valid_targets_mean": 4020.1,
"valid_targets_min": 629
},
{
"epoch": 2.2703091301222145,
"grad_norm": 0.5120310717401553,
"learning_rate": 3.419271630312571e-05,
"loss": 0.2713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09790432453155518,
"step": 1580,
"valid_targets_mean": 3122.2,
"valid_targets_min": 474
},
{
"epoch": 2.2774982027318478,
"grad_norm": 0.5335207312364842,
"learning_rate": 3.4142135623730954e-05,
"loss": 0.2803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15345562994480133,
"step": 1585,
"valid_targets_mean": 3602.5,
"valid_targets_min": 925
},
{
"epoch": 2.284687275341481,
"grad_norm": 0.5126000830068731,
"learning_rate": 3.4091373387253275e-05,
"loss": 0.2713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1684829741716385,
"step": 1590,
"valid_targets_mean": 4178.2,
"valid_targets_min": 516
},
{
"epoch": 2.2918763479511144,
"grad_norm": 0.48256289234266836,
"learning_rate": 3.4040430245379504e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11229759454727173,
"step": 1595,
"valid_targets_mean": 3424.4,
"valid_targets_min": 605
},
{
"epoch": 2.2990654205607477,
"grad_norm": 0.55020456280713,
"learning_rate": 3.398930685211895e-05,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11756587028503418,
"step": 1600,
"valid_targets_mean": 3094.5,
"valid_targets_min": 497
},
{
"epoch": 2.306254493170381,
"grad_norm": 0.441903715964592,
"learning_rate": 3.3938003863794985e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11097332835197449,
"step": 1605,
"valid_targets_mean": 3508.8,
"valid_targets_min": 613
},
{
"epoch": 2.3134435657800143,
"grad_norm": 0.5014046749229496,
"learning_rate": 3.3886521939036615e-05,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1317036747932434,
"step": 1610,
"valid_targets_mean": 3808.2,
"valid_targets_min": 755
},
{
"epoch": 2.3206326383896476,
"grad_norm": 0.5329301293062252,
"learning_rate": 3.383486173877006e-05,
"loss": 0.2739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12639915943145752,
"step": 1615,
"valid_targets_mean": 3335.2,
"valid_targets_min": 804
},
{
"epoch": 2.327821710999281,
"grad_norm": 0.5057564917431732,
"learning_rate": 3.378302392621023e-05,
"loss": 0.2823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15294601023197174,
"step": 1620,
"valid_targets_mean": 3938.2,
"valid_targets_min": 612
},
{
"epoch": 2.3350107836089142,
"grad_norm": 0.5552358600783263,
"learning_rate": 3.3731009166852234e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16431793570518494,
"step": 1625,
"valid_targets_mean": 4337.2,
"valid_targets_min": 1382
},
{
"epoch": 2.342199856218548,
"grad_norm": 0.4430784978799377,
"learning_rate": 3.367881812846282e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.118332639336586,
"step": 1630,
"valid_targets_mean": 3640.8,
"valid_targets_min": 470
},
{
"epoch": 2.3493889288281813,
"grad_norm": 0.492835719915706,
"learning_rate": 3.362645148107183e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13531847298145294,
"step": 1635,
"valid_targets_mean": 3750.9,
"valid_targets_min": 586
},
{
"epoch": 2.3565780014378146,
"grad_norm": 0.49387897152804017,
"learning_rate": 3.357390989696353e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12371513247489929,
"step": 1640,
"valid_targets_mean": 3756.9,
"valid_targets_min": 723
},
{
"epoch": 2.363767074047448,
"grad_norm": 0.5292204315605716,
"learning_rate": 3.352119405066809e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1294528990983963,
"step": 1645,
"valid_targets_mean": 3740.4,
"valid_targets_min": 726
},
{
"epoch": 2.370956146657081,
"grad_norm": 0.5482500192647483,
"learning_rate": 3.346830461895283e-05,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11841487884521484,
"step": 1650,
"valid_targets_mean": 3236.2,
"valid_targets_min": 617
},
{
"epoch": 2.3781452192667145,
"grad_norm": 0.5569155952182551,
"learning_rate": 3.3415242280813567e-05,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16182178258895874,
"step": 1655,
"valid_targets_mean": 3206.0,
"valid_targets_min": 643
},
{
"epoch": 2.385334291876348,
"grad_norm": 0.4187873978975146,
"learning_rate": 3.3362007717465884e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12652206420898438,
"step": 1660,
"valid_targets_mean": 4757.6,
"valid_targets_min": 995
},
{
"epoch": 2.392523364485981,
"grad_norm": 0.48405464845552704,
"learning_rate": 3.330860161233642e-05,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13703463971614838,
"step": 1665,
"valid_targets_mean": 3936.0,
"valid_targets_min": 779
},
{
"epoch": 2.399712437095615,
"grad_norm": 0.525936038970634,
"learning_rate": 3.3255024651054045e-05,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1976655125617981,
"step": 1670,
"valid_targets_mean": 4660.8,
"valid_targets_min": 2417
},
{
"epoch": 2.406901509705248,
"grad_norm": 0.48342772806241563,
"learning_rate": 3.320127752144111e-05,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18336616456508636,
"step": 1675,
"valid_targets_mean": 5358.4,
"valid_targets_min": 895
},
{
"epoch": 2.4140905823148815,
"grad_norm": 0.5414300080613395,
"learning_rate": 3.314736091350458e-05,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16382211446762085,
"step": 1680,
"valid_targets_mean": 4076.9,
"valid_targets_min": 950
},
{
"epoch": 2.421279654924515,
"grad_norm": 0.5247367013493369,
"learning_rate": 3.3093275519427175e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1400073617696762,
"step": 1685,
"valid_targets_mean": 3772.5,
"valid_targets_min": 913
},
{
"epoch": 2.428468727534148,
"grad_norm": 0.5038530432636198,
"learning_rate": 3.303902203355852e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08247102051973343,
"step": 1690,
"valid_targets_mean": 2354.1,
"valid_targets_min": 480
},
{
"epoch": 2.4356578001437814,
"grad_norm": 0.47032603091705133,
"learning_rate": 3.2984601152406176e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12384230643510818,
"step": 1695,
"valid_targets_mean": 3688.6,
"valid_targets_min": 554
},
{
"epoch": 2.4428468727534147,
"grad_norm": 0.6205205557490409,
"learning_rate": 3.293001357462676e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11945857107639313,
"step": 1700,
"valid_targets_mean": 2112.8,
"valid_targets_min": 489
},
{
"epoch": 2.450035945363048,
"grad_norm": 0.58735452653188,
"learning_rate": 3.287526000101693e-05,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14614614844322205,
"step": 1705,
"valid_targets_mean": 2608.5,
"valid_targets_min": 638
},
{
"epoch": 2.4572250179726813,
"grad_norm": 0.5529963455269361,
"learning_rate": 3.28203411345044e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15596972405910492,
"step": 1710,
"valid_targets_mean": 3632.6,
"valid_targets_min": 789
},
{
"epoch": 2.4644140905823146,
"grad_norm": 0.46547199433659353,
"learning_rate": 3.2765257680138914e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12506428360939026,
"step": 1715,
"valid_targets_mean": 4817.8,
"valid_targets_min": 3107
},
{
"epoch": 2.4716031631919484,
"grad_norm": 0.4630677382270778,
"learning_rate": 3.271001034508321e-05,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15703052282333374,
"step": 1720,
"valid_targets_mean": 4160.2,
"valid_targets_min": 847
},
{
"epoch": 2.4787922358015817,
"grad_norm": 0.537284473855485,
"learning_rate": 3.2654599838603934e-05,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11568139493465424,
"step": 1725,
"valid_targets_mean": 2814.8,
"valid_targets_min": 615
},
{
"epoch": 2.485981308411215,
"grad_norm": 0.5363135175126315,
"learning_rate": 3.259902687206251e-05,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10325951129198074,
"step": 1730,
"valid_targets_mean": 2743.4,
"valid_targets_min": 604
},
{
"epoch": 2.4931703810208483,
"grad_norm": 0.49958194974316356,
"learning_rate": 3.254329215890605e-05,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14953942596912384,
"step": 1735,
"valid_targets_mean": 4127.9,
"valid_targets_min": 792
},
{
"epoch": 2.5003594536304816,
"grad_norm": 0.47782238311011827,
"learning_rate": 3.2487396414658175e-05,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.093122698366642,
"step": 1740,
"valid_targets_mean": 2792.6,
"valid_targets_min": 766
},
{
"epoch": 2.507548526240115,
"grad_norm": 0.49969197033552243,
"learning_rate": 3.2431340356909785e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13741299510002136,
"step": 1745,
"valid_targets_mean": 3782.9,
"valid_targets_min": 978
},
{
"epoch": 2.5147375988497482,
"grad_norm": 0.48532507278419035,
"learning_rate": 3.2375124705309956e-05,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1263132393360138,
"step": 1750,
"valid_targets_mean": 3629.0,
"valid_targets_min": 706
},
{
"epoch": 2.521926671459382,
"grad_norm": 0.4891347428964143,
"learning_rate": 3.2318750181556575e-05,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13069723546504974,
"step": 1755,
"valid_targets_mean": 3528.9,
"valid_targets_min": 708
},
{
"epoch": 2.5291157440690153,
"grad_norm": 0.5186284903213042,
"learning_rate": 3.226221750938716e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1595681756734848,
"step": 1760,
"valid_targets_mean": 3760.9,
"valid_targets_min": 832
},
{
"epoch": 2.5363048166786486,
"grad_norm": 0.48093912887760065,
"learning_rate": 3.220552741456954e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15026655793190002,
"step": 1765,
"valid_targets_mean": 4527.4,
"valid_targets_min": 934
},
{
"epoch": 2.543493889288282,
"grad_norm": 0.4814466453376168,
"learning_rate": 3.214868062489254e-05,
"loss": 0.2777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13298210501670837,
"step": 1770,
"valid_targets_mean": 3778.2,
"valid_targets_min": 675
},
{
"epoch": 2.550682961897915,
"grad_norm": 0.4969943214307037,
"learning_rate": 3.209167787015663e-05,
"loss": 0.2716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15883077681064606,
"step": 1775,
"valid_targets_mean": 4380.6,
"valid_targets_min": 647
},
{
"epoch": 2.5578720345075485,
"grad_norm": 0.4560608460390592,
"learning_rate": 3.203451988216458e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11129967868328094,
"step": 1780,
"valid_targets_mean": 3518.4,
"valid_targets_min": 577
},
{
"epoch": 2.565061107117182,
"grad_norm": 0.5037014636875286,
"learning_rate": 3.197720739471202e-05,
"loss": 0.2753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15875720977783203,
"step": 1785,
"valid_targets_mean": 4701.8,
"valid_targets_min": 753
},
{
"epoch": 2.572250179726815,
"grad_norm": 0.472938402206803,
"learning_rate": 3.1919741143578086e-05,
"loss": 0.2735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12956391274929047,
"step": 1790,
"valid_targets_mean": 4941.9,
"valid_targets_min": 3822
},
{
"epoch": 2.5794392523364484,
"grad_norm": 0.4832272367661924,
"learning_rate": 3.186212186651591e-05,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1389496773481369,
"step": 1795,
"valid_targets_mean": 4036.4,
"valid_targets_min": 861
},
{
"epoch": 2.5866283249460817,
"grad_norm": 0.48575809575681733,
"learning_rate": 3.1804350303243175e-05,
"loss": 0.2777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.145027756690979,
"step": 1800,
"valid_targets_mean": 4709.1,
"valid_targets_min": 993
},
{
"epoch": 2.593817397555715,
"grad_norm": 0.5342164381090817,
"learning_rate": 3.174642719543262e-05,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14232099056243896,
"step": 1805,
"valid_targets_mean": 4011.2,
"valid_targets_min": 785
},
{
"epoch": 2.601006470165349,
"grad_norm": 0.5409491251603485,
"learning_rate": 3.168835328670252e-05,
"loss": 0.2652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15404319763183594,
"step": 1810,
"valid_targets_mean": 4418.6,
"valid_targets_min": 906
},
{
"epoch": 2.608195542774982,
"grad_norm": 0.5368817093148895,
"learning_rate": 3.1630129322607135e-05,
"loss": 0.2716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15413588285446167,
"step": 1815,
"valid_targets_mean": 3734.1,
"valid_targets_min": 567
},
{
"epoch": 2.6153846153846154,
"grad_norm": 0.4908534227910792,
"learning_rate": 3.157175605062715e-05,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11011715233325958,
"step": 1820,
"valid_targets_mean": 3284.6,
"valid_targets_min": 545
},
{
"epoch": 2.6225736879942487,
"grad_norm": 0.6400744445531912,
"learning_rate": 3.1513234220160046e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18450883030891418,
"step": 1825,
"valid_targets_mean": 2911.4,
"valid_targets_min": 467
},
{
"epoch": 2.629762760603882,
"grad_norm": 0.47741062151662667,
"learning_rate": 3.145456458251052e-05,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1267721801996231,
"step": 1830,
"valid_targets_mean": 3127.4,
"valid_targets_min": 875
},
{
"epoch": 2.6369518332135153,
"grad_norm": 0.5287490483158872,
"learning_rate": 3.139574789088081e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11356522142887115,
"step": 1835,
"valid_targets_mean": 2696.1,
"valid_targets_min": 661
},
{
"epoch": 2.644140905823149,
"grad_norm": 0.5207652535003496,
"learning_rate": 3.133678490036105e-05,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11317160725593567,
"step": 1840,
"valid_targets_mean": 2998.9,
"valid_targets_min": 551
},
{
"epoch": 2.6513299784327824,
"grad_norm": 0.49826783220149434,
"learning_rate": 3.1277676367919536e-05,
"loss": 0.2667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12781062722206116,
"step": 1845,
"valid_targets_mean": 3907.8,
"valid_targets_min": 804
},
{
"epoch": 2.6585190510424157,
"grad_norm": 0.49684271540043673,
"learning_rate": 3.121842305239307e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15386344492435455,
"step": 1850,
"valid_targets_mean": 4322.5,
"valid_targets_min": 515
},
{
"epoch": 2.665708123652049,
"grad_norm": 0.42219428290284244,
"learning_rate": 3.115902571447716e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11060372740030289,
"step": 1855,
"valid_targets_mean": 4049.8,
"valid_targets_min": 790
},
{
"epoch": 2.6728971962616823,
"grad_norm": 0.5333465277393413,
"learning_rate": 3.109948511671628e-05,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15619201958179474,
"step": 1860,
"valid_targets_mean": 3500.9,
"valid_targets_min": 956
},
{
"epoch": 2.6800862688713156,
"grad_norm": 0.5898901842447883,
"learning_rate": 3.103980202349409e-05,
"loss": 0.2684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14231330156326294,
"step": 1865,
"valid_targets_mean": 4065.4,
"valid_targets_min": 937
},
{
"epoch": 2.687275341480949,
"grad_norm": 0.5275929648717342,
"learning_rate": 3.097997720102359e-05,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11855625361204147,
"step": 1870,
"valid_targets_mean": 2870.2,
"valid_targets_min": 906
},
{
"epoch": 2.6944644140905822,
"grad_norm": 0.5322646973037383,
"learning_rate": 3.092001141733731e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1415766030550003,
"step": 1875,
"valid_targets_mean": 3502.4,
"valid_targets_min": 551
},
{
"epoch": 2.7016534867002155,
"grad_norm": 0.4532218793273748,
"learning_rate": 3.085990544227745e-05,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1096867173910141,
"step": 1880,
"valid_targets_mean": 4147.9,
"valid_targets_min": 422
},
{
"epoch": 2.708842559309849,
"grad_norm": 0.49742211703854067,
"learning_rate": 3.079966004748601e-05,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12179790437221527,
"step": 1885,
"valid_targets_mean": 3049.1,
"valid_targets_min": 663
},
{
"epoch": 2.716031631919482,
"grad_norm": 0.5312740695729437,
"learning_rate": 3.073927600639481e-05,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18648596107959747,
"step": 1890,
"valid_targets_mean": 4425.0,
"valid_targets_min": 3644
},
{
"epoch": 2.723220704529116,
"grad_norm": 0.45492540963452555,
"learning_rate": 3.0678754094215654e-05,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12681034207344055,
"step": 1895,
"valid_targets_mean": 4011.2,
"valid_targets_min": 1087
},
{
"epoch": 2.730409777138749,
"grad_norm": 0.5324709930689125,
"learning_rate": 3.061809508793033e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1529749035835266,
"step": 1900,
"valid_targets_mean": 4182.0,
"valid_targets_min": 969
},
{
"epoch": 2.7375988497483825,
"grad_norm": 0.5282988045210955,
"learning_rate": 3.055729976628066e-05,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11237910389900208,
"step": 1905,
"valid_targets_mean": 2708.0,
"valid_targets_min": 600
},
{
"epoch": 2.744787922358016,
"grad_norm": 0.4592623854572585,
"learning_rate": 3.0496368909758448e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14295190572738647,
"step": 1910,
"valid_targets_mean": 4066.2,
"valid_targets_min": 440
},
{
"epoch": 2.751976994967649,
"grad_norm": 0.4288185851911634,
"learning_rate": 3.0435303300595538e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14109700918197632,
"step": 1915,
"valid_targets_mean": 4810.4,
"valid_targets_min": 624
},
{
"epoch": 2.7591660675772824,
"grad_norm": 0.4511482248881237,
"learning_rate": 3.0374103722753704e-05,
"loss": 0.262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11241908371448517,
"step": 1920,
"valid_targets_mean": 3693.0,
"valid_targets_min": 833
},
{
"epoch": 2.7663551401869158,
"grad_norm": 0.4413291911556102,
"learning_rate": 3.0312770961914623e-05,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12785547971725464,
"step": 1925,
"valid_targets_mean": 4205.5,
"valid_targets_min": 615
},
{
"epoch": 2.7735442127965495,
"grad_norm": 0.44230100469185457,
"learning_rate": 3.0251305805469776e-05,
"loss": 0.2628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13793818652629852,
"step": 1930,
"valid_targets_mean": 4618.0,
"valid_targets_min": 3914
},
{
"epoch": 2.780733285406183,
"grad_norm": 0.5078636318952374,
"learning_rate": 3.0189709042510345e-05,
"loss": 0.2631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1292886734008789,
"step": 1935,
"valid_targets_mean": 2961.2,
"valid_targets_min": 427
},
{
"epoch": 2.787922358015816,
"grad_norm": 0.5115324989698494,
"learning_rate": 3.012798146381709e-05,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15270881354808807,
"step": 1940,
"valid_targets_mean": 3834.8,
"valid_targets_min": 522
},
{
"epoch": 2.7951114306254494,
"grad_norm": 0.4648202628041615,
"learning_rate": 3.0066123861850162e-05,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10922946035861969,
"step": 1945,
"valid_targets_mean": 3411.1,
"valid_targets_min": 858
},
{
"epoch": 2.8023005032350827,
"grad_norm": 0.5272395212940438,
"learning_rate": 3.000413703073898e-05,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12008656561374664,
"step": 1950,
"valid_targets_mean": 2605.2,
"valid_targets_min": 772
},
{
"epoch": 2.809489575844716,
"grad_norm": 0.524615079864663,
"learning_rate": 2.994202176627198e-05,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.134141206741333,
"step": 1955,
"valid_targets_mean": 3072.1,
"valid_targets_min": 707
},
{
"epoch": 2.8166786484543493,
"grad_norm": 0.5277222260085981,
"learning_rate": 2.987977886588646e-05,
"loss": 0.2533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11295173317193985,
"step": 1960,
"valid_targets_mean": 2585.8,
"valid_targets_min": 456
},
{
"epoch": 2.8238677210639826,
"grad_norm": 0.5327387085151372,
"learning_rate": 2.981740912865829e-05,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11163774132728577,
"step": 1965,
"valid_targets_mean": 2804.4,
"valid_targets_min": 680
},
{
"epoch": 2.831056793673616,
"grad_norm": 0.5286702950441636,
"learning_rate": 2.9754913355291687e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11060294508934021,
"step": 1970,
"valid_targets_mean": 3187.1,
"valid_targets_min": 596
},
{
"epoch": 2.8382458662832493,
"grad_norm": 0.48936639413972866,
"learning_rate": 2.9692292348108913e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14475484192371368,
"step": 1975,
"valid_targets_mean": 3586.5,
"valid_targets_min": 701
},
{
"epoch": 2.8454349388928826,
"grad_norm": 0.41895977374703486,
"learning_rate": 2.9629546911039995e-05,
"loss": 0.27,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1372557133436203,
"step": 1980,
"valid_targets_mean": 5150.8,
"valid_targets_min": 4277
},
{
"epoch": 2.8526240115025163,
"grad_norm": 0.4623645207037126,
"learning_rate": 2.9566677849612383e-05,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12075348943471909,
"step": 1985,
"valid_targets_mean": 2770.5,
"valid_targets_min": 531
},
{
"epoch": 2.8598130841121496,
"grad_norm": 0.4547471741235561,
"learning_rate": 2.950368597094063e-05,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12804922461509705,
"step": 1990,
"valid_targets_mean": 4452.6,
"valid_targets_min": 3473
},
{
"epoch": 2.867002156721783,
"grad_norm": 0.5716261379564964,
"learning_rate": 2.9440572083716e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13049060106277466,
"step": 1995,
"valid_targets_mean": 3718.5,
"valid_targets_min": 949
},
{
"epoch": 2.8741912293314162,
"grad_norm": 0.4523003790407094,
"learning_rate": 2.9377336998196147e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13575586676597595,
"step": 2000,
"valid_targets_mean": 3801.2,
"valid_targets_min": 535
},
{
"epoch": 2.8813803019410495,
"grad_norm": 0.5916418462296764,
"learning_rate": 2.931398152619462e-05,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10240516811609268,
"step": 2005,
"valid_targets_mean": 1806.5,
"valid_targets_min": 471
},
{
"epoch": 2.888569374550683,
"grad_norm": 0.5087183669235579,
"learning_rate": 2.925050648107053e-05,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1419801115989685,
"step": 2010,
"valid_targets_mean": 3731.9,
"valid_targets_min": 610
},
{
"epoch": 2.895758447160316,
"grad_norm": 0.5450170825216338,
"learning_rate": 2.9186912677718044e-05,
"loss": 0.2687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15140527486801147,
"step": 2015,
"valid_targets_mean": 3016.1,
"valid_targets_min": 581
},
{
"epoch": 2.90294751976995,
"grad_norm": 0.5243099796515388,
"learning_rate": 2.912320093255599e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09774617850780487,
"step": 2020,
"valid_targets_mean": 2224.4,
"valid_targets_min": 493
},
{
"epoch": 2.910136592379583,
"grad_norm": 0.4918756856019155,
"learning_rate": 2.9059372063517285e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10992417484521866,
"step": 2025,
"valid_targets_mean": 3224.4,
"valid_targets_min": 594
},
{
"epoch": 2.9173256649892165,
"grad_norm": 0.5043736261289858,
"learning_rate": 2.8995426890038533e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19480252265930176,
"step": 2030,
"valid_targets_mean": 5160.0,
"valid_targets_min": 573
},
{
"epoch": 2.92451473759885,
"grad_norm": 0.4624647860625992,
"learning_rate": 2.8931366233049415e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1291601061820984,
"step": 2035,
"valid_targets_mean": 3699.6,
"valid_targets_min": 758
},
{
"epoch": 2.931703810208483,
"grad_norm": 0.4567936051912573,
"learning_rate": 2.8867190914962228e-05,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1221659928560257,
"step": 2040,
"valid_targets_mean": 3541.9,
"valid_targets_min": 989
},
{
"epoch": 2.9388928828181164,
"grad_norm": 0.5108265761866421,
"learning_rate": 2.8802901759661256e-05,
"loss": 0.2693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11455883830785751,
"step": 2045,
"valid_targets_mean": 2693.2,
"valid_targets_min": 574
},
{
"epoch": 2.9460819554277498,
"grad_norm": 0.462539235433949,
"learning_rate": 2.873849959249226e-05,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12773972749710083,
"step": 2050,
"valid_targets_mean": 3324.9,
"valid_targets_min": 688
},
{
"epoch": 2.953271028037383,
"grad_norm": 0.4922307858611935,
"learning_rate": 2.8673985240251835e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15249422192573547,
"step": 2055,
"valid_targets_mean": 4484.2,
"valid_targets_min": 685
},
{
"epoch": 2.9604601006470164,
"grad_norm": 0.5119981885399685,
"learning_rate": 2.860935953117681e-05,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13160674273967743,
"step": 2060,
"valid_targets_mean": 3732.1,
"valid_targets_min": 680
},
{
"epoch": 2.9676491732566497,
"grad_norm": 0.5867234583593739,
"learning_rate": 2.854462329493362e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13651028275489807,
"step": 2065,
"valid_targets_mean": 2434.2,
"valid_targets_min": 840
},
{
"epoch": 2.974838245866283,
"grad_norm": 0.4906003413994672,
"learning_rate": 2.8479777362607647e-05,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14013247191905975,
"step": 2070,
"valid_targets_mean": 3921.0,
"valid_targets_min": 557
},
{
"epoch": 2.9820273184759167,
"grad_norm": 0.5123460997995863,
"learning_rate": 2.8414822566692558e-05,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14255797863006592,
"step": 2075,
"valid_targets_mean": 3564.1,
"valid_targets_min": 751
},
{
"epoch": 2.98921639108555,
"grad_norm": 0.43494582159562417,
"learning_rate": 2.8349759741079607e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11678533256053925,
"step": 2080,
"valid_targets_mean": 4366.4,
"valid_targets_min": 3042
},
{
"epoch": 2.9964054636951833,
"grad_norm": 0.45854822797123423,
"learning_rate": 2.828458972104695e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12588660418987274,
"step": 2085,
"valid_targets_mean": 3966.5,
"valid_targets_min": 595
},
{
"epoch": 3.0028756290438534,
"grad_norm": 0.7069079359730072,
"learning_rate": 2.8219313343248885e-05,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16991043090820312,
"step": 2090,
"valid_targets_mean": 4596.9,
"valid_targets_min": 1041
},
{
"epoch": 3.0100647016534867,
"grad_norm": 0.5545887030564403,
"learning_rate": 2.8153931445705162e-05,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15513832867145538,
"step": 2095,
"valid_targets_mean": 3631.5,
"valid_targets_min": 615
},
{
"epoch": 3.01725377426312,
"grad_norm": 0.508386475491845,
"learning_rate": 2.808844486779016e-05,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13907843828201294,
"step": 2100,
"valid_targets_mean": 3614.2,
"valid_targets_min": 315
},
{
"epoch": 3.0244428468727533,
"grad_norm": 0.5044166011046787,
"learning_rate": 2.8022854450222182e-05,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12767350673675537,
"step": 2105,
"valid_targets_mean": 3602.5,
"valid_targets_min": 690
},
{
"epoch": 3.0316319194823866,
"grad_norm": 0.4597303620877388,
"learning_rate": 2.7957161035052606e-05,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1011454239487648,
"step": 2110,
"valid_targets_mean": 3388.5,
"valid_targets_min": 693
},
{
"epoch": 3.03882099209202,
"grad_norm": 0.5324995493873002,
"learning_rate": 2.789136546565511e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15829084813594818,
"step": 2115,
"valid_targets_mean": 3950.1,
"valid_targets_min": 641
},
{
"epoch": 3.0460100647016537,
"grad_norm": 0.4661168596192042,
"learning_rate": 2.782546858671481e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10927501320838928,
"step": 2120,
"valid_targets_mean": 3423.1,
"valid_targets_min": 830
},
{
"epoch": 3.053199137311287,
"grad_norm": 0.5030757007783364,
"learning_rate": 2.775947124421746e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12120012938976288,
"step": 2125,
"valid_targets_mean": 3486.4,
"valid_targets_min": 730
},
{
"epoch": 3.0603882099209203,
"grad_norm": 0.5093743527850355,
"learning_rate": 2.7693374285438547e-05,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12037092447280884,
"step": 2130,
"valid_targets_mean": 3773.8,
"valid_targets_min": 701
},
{
"epoch": 3.0675772825305536,
"grad_norm": 0.5318422279637071,
"learning_rate": 2.7627178558932456e-05,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12518146634101868,
"step": 2135,
"valid_targets_mean": 2867.9,
"valid_targets_min": 736
},
{
"epoch": 3.074766355140187,
"grad_norm": 0.5495389139214483,
"learning_rate": 2.756088491452153e-05,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17592960596084595,
"step": 2140,
"valid_targets_mean": 5162.5,
"valid_targets_min": 617
},
{
"epoch": 3.0819554277498202,
"grad_norm": 0.5080084657969545,
"learning_rate": 2.749449420328521e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12165935337543488,
"step": 2145,
"valid_targets_mean": 3485.5,
"valid_targets_min": 603
},
{
"epoch": 3.0891445003594535,
"grad_norm": 0.4581974538526893,
"learning_rate": 2.742800727754906e-05,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13358767330646515,
"step": 2150,
"valid_targets_mean": 4797.4,
"valid_targets_min": 629
},
{
"epoch": 3.096333572969087,
"grad_norm": 0.5293145081012333,
"learning_rate": 2.7361424990873864e-05,
"loss": 0.2406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12826603651046753,
"step": 2155,
"valid_targets_mean": 3203.6,
"valid_targets_min": 609
},
{
"epoch": 3.10352264557872,
"grad_norm": 0.5045238984815654,
"learning_rate": 2.7294748198044637e-05,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1334061473608017,
"step": 2160,
"valid_targets_mean": 3690.8,
"valid_targets_min": 611
},
{
"epoch": 3.110711718188354,
"grad_norm": 0.5944184962075417,
"learning_rate": 2.722797775505969e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12685522437095642,
"step": 2165,
"valid_targets_mean": 3470.2,
"valid_targets_min": 862
},
{
"epoch": 3.117900790797987,
"grad_norm": 0.5242002429250229,
"learning_rate": 2.7161114519119593e-05,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18032889068126678,
"step": 2170,
"valid_targets_mean": 4346.6,
"valid_targets_min": 567
},
{
"epoch": 3.1250898634076205,
"grad_norm": 0.47519017295660587,
"learning_rate": 2.7094159348616203e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11818739026784897,
"step": 2175,
"valid_targets_mean": 3679.6,
"valid_targets_min": 620
},
{
"epoch": 3.132278936017254,
"grad_norm": 0.5510983437184556,
"learning_rate": 2.702711310312164e-05,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11581596732139587,
"step": 2180,
"valid_targets_mean": 3518.8,
"valid_targets_min": 653
},
{
"epoch": 3.139468008626887,
"grad_norm": 0.46201415582633937,
"learning_rate": 2.6959976643377238e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1287374198436737,
"step": 2185,
"valid_targets_mean": 4390.4,
"valid_targets_min": 854
},
{
"epoch": 3.1466570812365204,
"grad_norm": 0.49096146703639676,
"learning_rate": 2.689275083128252e-05,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12094248831272125,
"step": 2190,
"valid_targets_mean": 3696.8,
"valid_targets_min": 368
},
{
"epoch": 3.1538461538461537,
"grad_norm": 0.4994916178852232,
"learning_rate": 2.6825436529884094e-05,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11061419546604156,
"step": 2195,
"valid_targets_mean": 3000.4,
"valid_targets_min": 514
},
{
"epoch": 3.161035226455787,
"grad_norm": 0.5036089659495702,
"learning_rate": 2.6758034603364608e-05,
"loss": 0.2642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11006475985050201,
"step": 2200,
"valid_targets_mean": 3325.2,
"valid_targets_min": 723
},
{
"epoch": 3.1682242990654204,
"grad_norm": 0.47055905502722695,
"learning_rate": 2.669054591703165e-05,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12930098176002502,
"step": 2205,
"valid_targets_mean": 4341.8,
"valid_targets_min": 938
},
{
"epoch": 3.175413371675054,
"grad_norm": 0.608692174157198,
"learning_rate": 2.6622971337306625e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09900519251823425,
"step": 2210,
"valid_targets_mean": 1953.5,
"valid_targets_min": 484
},
{
"epoch": 3.1826024442846874,
"grad_norm": 0.47784907638231894,
"learning_rate": 2.6555311731713626e-05,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12810474634170532,
"step": 2215,
"valid_targets_mean": 3757.8,
"valid_targets_min": 758
},
{
"epoch": 3.1897915168943207,
"grad_norm": 0.5130577267818007,
"learning_rate": 2.6487567968868347e-05,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12371031194925308,
"step": 2220,
"valid_targets_mean": 3631.8,
"valid_targets_min": 504
},
{
"epoch": 3.196980589503954,
"grad_norm": 0.4808527638754144,
"learning_rate": 2.6419740918466844e-05,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09714284539222717,
"step": 2225,
"valid_targets_mean": 3717.6,
"valid_targets_min": 586
},
{
"epoch": 3.2041696621135873,
"grad_norm": 0.5518930760729734,
"learning_rate": 2.6351831451274477e-05,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11862578988075256,
"step": 2230,
"valid_targets_mean": 2508.8,
"valid_targets_min": 468
},
{
"epoch": 3.2113587347232206,
"grad_norm": 0.4940521060256115,
"learning_rate": 2.628384043911462e-05,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13668888807296753,
"step": 2235,
"valid_targets_mean": 4032.0,
"valid_targets_min": 891
},
{
"epoch": 3.218547807332854,
"grad_norm": 0.5034504739886473,
"learning_rate": 2.621576875485757e-05,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1095261424779892,
"step": 2240,
"valid_targets_mean": 3305.0,
"valid_targets_min": 573
},
{
"epoch": 3.2257368799424873,
"grad_norm": 0.43830856076779845,
"learning_rate": 2.6147617272409255e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12325970083475113,
"step": 2245,
"valid_targets_mean": 4494.5,
"valid_targets_min": 916
},
{
"epoch": 3.2329259525521206,
"grad_norm": 0.47839573422386605,
"learning_rate": 2.6079386866700095e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1166163831949234,
"step": 2250,
"valid_targets_mean": 3777.6,
"valid_targets_min": 580
},
{
"epoch": 3.2401150251617543,
"grad_norm": 0.4602584782158853,
"learning_rate": 2.6011078413673692e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12046687304973602,
"step": 2255,
"valid_targets_mean": 4617.8,
"valid_targets_min": 3984
},
{
"epoch": 3.2473040977713876,
"grad_norm": 0.4655312917452448,
"learning_rate": 2.594269279027564e-05,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12522590160369873,
"step": 2260,
"valid_targets_mean": 4336.1,
"valid_targets_min": 762
},
{
"epoch": 3.254493170381021,
"grad_norm": 0.48726149453285067,
"learning_rate": 2.5874230874442238e-05,
"loss": 0.2559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15026704967021942,
"step": 2265,
"valid_targets_mean": 4303.4,
"valid_targets_min": 895
},
{
"epoch": 3.2616822429906542,
"grad_norm": 0.6304249424929381,
"learning_rate": 2.580569354508925e-05,
"loss": 0.258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13789577782154083,
"step": 2270,
"valid_targets_mean": 2981.5,
"valid_targets_min": 639
},
{
"epoch": 3.2688713156002875,
"grad_norm": 0.6086760431353105,
"learning_rate": 2.5737081682100575e-05,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10886932909488678,
"step": 2275,
"valid_targets_mean": 1702.2,
"valid_targets_min": 579
},
{
"epoch": 3.276060388209921,
"grad_norm": 0.45586872184556493,
"learning_rate": 2.5668396166316988e-05,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1350633203983307,
"step": 2280,
"valid_targets_mean": 5057.0,
"valid_targets_min": 3466
},
{
"epoch": 3.283249460819554,
"grad_norm": 0.461465009195521,
"learning_rate": 2.5599637879524822e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12891460955142975,
"step": 2285,
"valid_targets_mean": 3825.4,
"valid_targets_min": 636
},
{
"epoch": 3.2904385334291875,
"grad_norm": 0.4806164913168704,
"learning_rate": 2.5530807704444646e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10771054029464722,
"step": 2290,
"valid_targets_mean": 4006.0,
"valid_targets_min": 665
},
{
"epoch": 3.297627606038821,
"grad_norm": 0.5441576056359098,
"learning_rate": 2.5461906524719927e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12522868812084198,
"step": 2295,
"valid_targets_mean": 3343.1,
"valid_targets_min": 705
},
{
"epoch": 3.3048166786484545,
"grad_norm": 0.5946930017526083,
"learning_rate": 2.539293522490569e-05,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1276351809501648,
"step": 2300,
"valid_targets_mean": 2709.4,
"valid_targets_min": 639
},
{
"epoch": 3.312005751258088,
"grad_norm": 0.4879292674456743,
"learning_rate": 2.5323894690457186e-05,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12799575924873352,
"step": 2305,
"valid_targets_mean": 3353.2,
"valid_targets_min": 609
},
{
"epoch": 3.319194823867721,
"grad_norm": 0.42910242310010305,
"learning_rate": 2.525478580771847e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10297475755214691,
"step": 2310,
"valid_targets_mean": 4044.0,
"valid_targets_min": 258
},
{
"epoch": 3.3263838964773544,
"grad_norm": 0.5347387405067475,
"learning_rate": 2.5185609463911068e-05,
"loss": 0.2416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12474454939365387,
"step": 2315,
"valid_targets_mean": 4503.6,
"valid_targets_min": 3153
},
{
"epoch": 3.3335729690869877,
"grad_norm": 0.4700670848022084,
"learning_rate": 2.511636654712258e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10849539190530777,
"step": 2320,
"valid_targets_mean": 3746.0,
"valid_targets_min": 684
},
{
"epoch": 3.340762041696621,
"grad_norm": 0.4835583524848898,
"learning_rate": 2.5047057946295263e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440524011850357,
"step": 2325,
"valid_targets_mean": 4286.1,
"valid_targets_min": 451
},
{
"epoch": 3.3479511143062544,
"grad_norm": 0.6506238528935938,
"learning_rate": 2.4977684551214628e-05,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1264440417289734,
"step": 2330,
"valid_targets_mean": 3910.2,
"valid_targets_min": 551
},
{
"epoch": 3.3551401869158877,
"grad_norm": 0.5480561132118623,
"learning_rate": 2.4908247252498016e-05,
"loss": 0.2475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12950649857521057,
"step": 2335,
"valid_targets_mean": 2837.0,
"valid_targets_min": 724
},
{
"epoch": 3.362329259525521,
"grad_norm": 0.447018910737458,
"learning_rate": 2.4838746941583165e-05,
"loss": 0.2468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10450244694948196,
"step": 2340,
"valid_targets_mean": 3569.1,
"valid_targets_min": 791
},
{
"epoch": 3.3695183321351547,
"grad_norm": 0.5293944991502482,
"learning_rate": 2.476918451071677e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15744715929031372,
"step": 2345,
"valid_targets_mean": 4600.1,
"valid_targets_min": 827
},
{
"epoch": 3.376707404744788,
"grad_norm": 0.5794346987479623,
"learning_rate": 2.4699560852943015e-05,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10630621761083603,
"step": 2350,
"valid_targets_mean": 2537.6,
"valid_targets_min": 591
},
{
"epoch": 3.3838964773544213,
"grad_norm": 0.567018449508628,
"learning_rate": 2.4629876862092123e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13535767793655396,
"step": 2355,
"valid_targets_mean": 3689.2,
"valid_targets_min": 646
},
{
"epoch": 3.3910855499640546,
"grad_norm": 0.49820742830571135,
"learning_rate": 2.4560133432768868e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11119614541530609,
"step": 2360,
"valid_targets_mean": 3304.4,
"valid_targets_min": 594
},
{
"epoch": 3.398274622573688,
"grad_norm": 0.4797249357815499,
"learning_rate": 2.4490331460341112e-05,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10317108780145645,
"step": 2365,
"valid_targets_mean": 3439.0,
"valid_targets_min": 619
},
{
"epoch": 3.4054636951833213,
"grad_norm": 0.5444831821184157,
"learning_rate": 2.442047184092827e-05,
"loss": 0.2493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11617874354124069,
"step": 2370,
"valid_targets_mean": 3076.0,
"valid_targets_min": 492
},
{
"epoch": 3.4126527677929546,
"grad_norm": 0.5107430646256917,
"learning_rate": 2.435055547138986e-05,
"loss": 0.2506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.124700166285038,
"step": 2375,
"valid_targets_mean": 3625.1,
"valid_targets_min": 598
},
{
"epoch": 3.419841840402588,
"grad_norm": 0.5189568720557954,
"learning_rate": 2.4280583249313925e-05,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14366132020950317,
"step": 2380,
"valid_targets_mean": 4110.0,
"valid_targets_min": 610
},
{
"epoch": 3.4270309130122216,
"grad_norm": 0.5341482929308659,
"learning_rate": 2.4210556073005574e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.141306534409523,
"step": 2385,
"valid_targets_mean": 3757.0,
"valid_targets_min": 628
},
{
"epoch": 3.434219985621855,
"grad_norm": 0.48115635467476825,
"learning_rate": 2.4140474841475414e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12492194771766663,
"step": 2390,
"valid_targets_mean": 4349.9,
"valid_targets_min": 3705
},
{
"epoch": 3.4414090582314882,
"grad_norm": 0.48336377937661607,
"learning_rate": 2.4070340454427997e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1366448700428009,
"step": 2395,
"valid_targets_mean": 3848.9,
"valid_targets_min": 634
},
{
"epoch": 3.4485981308411215,
"grad_norm": 0.5304216588904245,
"learning_rate": 2.4000153812250307e-05,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11717712134122849,
"step": 2400,
"valid_targets_mean": 2570.8,
"valid_targets_min": 647
},
{
"epoch": 3.455787203450755,
"grad_norm": 0.6855077706341426,
"learning_rate": 2.3929915816000168e-05,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15973010659217834,
"step": 2405,
"valid_targets_mean": 3849.2,
"valid_targets_min": 810
},
{
"epoch": 3.462976276060388,
"grad_norm": 0.540313346399356,
"learning_rate": 2.3859627367394688e-05,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1391582190990448,
"step": 2410,
"valid_targets_mean": 3065.8,
"valid_targets_min": 635
},
{
"epoch": 3.4701653486700215,
"grad_norm": 0.49233214084773025,
"learning_rate": 2.3789289368798697e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14611698687076569,
"step": 2415,
"valid_targets_mean": 4553.0,
"valid_targets_min": 978
},
{
"epoch": 3.4773544212796548,
"grad_norm": 0.4898159022933566,
"learning_rate": 2.3718902723213142e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13121764361858368,
"step": 2420,
"valid_targets_mean": 4073.2,
"valid_targets_min": 632
},
{
"epoch": 3.484543493889288,
"grad_norm": 0.5398527086062614,
"learning_rate": 2.3648468334263495e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1375160962343216,
"step": 2425,
"valid_targets_mean": 3811.4,
"valid_targets_min": 765
},
{
"epoch": 3.491732566498922,
"grad_norm": 0.4501147730461357,
"learning_rate": 2.357798710618817e-05,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1265125274658203,
"step": 2430,
"valid_targets_mean": 4631.2,
"valid_targets_min": 3903
},
{
"epoch": 3.498921639108555,
"grad_norm": 0.4518210089516425,
"learning_rate": 2.3507459943826888e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13443484902381897,
"step": 2435,
"valid_targets_mean": 4459.2,
"valid_targets_min": 920
},
{
"epoch": 3.5061107117181884,
"grad_norm": 0.46454350403949213,
"learning_rate": 2.343688775260909e-05,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10301059484481812,
"step": 2440,
"valid_targets_mean": 3593.6,
"valid_targets_min": 615
},
{
"epoch": 3.5132997843278218,
"grad_norm": 0.49423402003357275,
"learning_rate": 2.3366271438542287e-05,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09725943207740784,
"step": 2445,
"valid_targets_mean": 3318.4,
"valid_targets_min": 649
},
{
"epoch": 3.520488856937455,
"grad_norm": 0.47637389226364873,
"learning_rate": 2.3295611908200454e-05,
"loss": 0.2473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10003632307052612,
"step": 2450,
"valid_targets_mean": 3680.4,
"valid_targets_min": 709
},
{
"epoch": 3.5276779295470884,
"grad_norm": 0.4918339024950877,
"learning_rate": 2.3224910068712355e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.126363143324852,
"step": 2455,
"valid_targets_mean": 3840.5,
"valid_targets_min": 576
},
{
"epoch": 3.5348670021567217,
"grad_norm": 0.5921138868050676,
"learning_rate": 2.3154166827749947e-05,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11931576579809189,
"step": 2460,
"valid_targets_mean": 2681.2,
"valid_targets_min": 732
},
{
"epoch": 3.542056074766355,
"grad_norm": 0.6086195584987955,
"learning_rate": 2.3083383093516686e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12224029749631882,
"step": 2465,
"valid_targets_mean": 3808.8,
"valid_targets_min": 787
},
{
"epoch": 3.5492451473759887,
"grad_norm": 0.5021142253817824,
"learning_rate": 2.301255977473587e-05,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11519993841648102,
"step": 2470,
"valid_targets_mean": 3547.0,
"valid_targets_min": 693
},
{
"epoch": 3.556434219985622,
"grad_norm": 0.504249898299747,
"learning_rate": 2.2941697780639018e-05,
"loss": 0.2642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11413753032684326,
"step": 2475,
"valid_targets_mean": 3386.0,
"valid_targets_min": 713
},
{
"epoch": 3.5636232925952553,
"grad_norm": 0.5258515811866988,
"learning_rate": 2.2870798020954127e-05,
"loss": 0.2464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09162728488445282,
"step": 2480,
"valid_targets_mean": 2764.0,
"valid_targets_min": 563
},
{
"epoch": 3.5708123652048886,
"grad_norm": 0.45667405800785726,
"learning_rate": 2.279986140589405e-05,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14917941391468048,
"step": 2485,
"valid_targets_mean": 4933.5,
"valid_targets_min": 693
},
{
"epoch": 3.578001437814522,
"grad_norm": 0.47014637028947304,
"learning_rate": 2.2728888846144788e-05,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12864919006824493,
"step": 2490,
"valid_targets_mean": 4165.1,
"valid_targets_min": 752
},
{
"epoch": 3.5851905104241553,
"grad_norm": 0.5232237334052633,
"learning_rate": 2.2657881252853792e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11721894145011902,
"step": 2495,
"valid_targets_mean": 3049.2,
"valid_targets_min": 618
},
{
"epoch": 3.5923795830337886,
"grad_norm": 0.48021599807423754,
"learning_rate": 2.2586839537618285e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10148143023252487,
"step": 2500,
"valid_targets_mean": 3688.9,
"valid_targets_min": 525
},
{
"epoch": 3.599568655643422,
"grad_norm": 0.4923060580408922,
"learning_rate": 2.2515764612473553e-05,
"loss": 0.2422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10971393436193466,
"step": 2505,
"valid_targets_mean": 3988.9,
"valid_targets_min": 634
},
{
"epoch": 3.606757728253055,
"grad_norm": 0.6862438146632643,
"learning_rate": 2.2444657389881203e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11502759903669357,
"step": 2510,
"valid_targets_mean": 2437.4,
"valid_targets_min": 502
},
{
"epoch": 3.6139468008626885,
"grad_norm": 0.57899984231831,
"learning_rate": 2.2373518782717513e-05,
"loss": 0.2527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13824304938316345,
"step": 2515,
"valid_targets_mean": 4252.1,
"valid_targets_min": 611
},
{
"epoch": 3.621135873472322,
"grad_norm": 0.47585894131516004,
"learning_rate": 2.2302349704261657e-05,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1324179470539093,
"step": 2520,
"valid_targets_mean": 4517.6,
"valid_targets_min": 601
},
{
"epoch": 3.6283249460819555,
"grad_norm": 0.41528620994981147,
"learning_rate": 2.2231151068184005e-05,
"loss": 0.2408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1042901873588562,
"step": 2525,
"valid_targets_mean": 4695.5,
"valid_targets_min": 3257
},
{
"epoch": 3.635514018691589,
"grad_norm": 0.5069891883936893,
"learning_rate": 2.2159923788534383e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1232769638299942,
"step": 2530,
"valid_targets_mean": 3207.2,
"valid_targets_min": 652
},
{
"epoch": 3.642703091301222,
"grad_norm": 0.43169111980404523,
"learning_rate": 2.2088668779730352e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11891108006238937,
"step": 2535,
"valid_targets_mean": 4488.8,
"valid_targets_min": 933
},
{
"epoch": 3.6498921639108555,
"grad_norm": 0.53035855657901,
"learning_rate": 2.201738695654546e-05,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12702947854995728,
"step": 2540,
"valid_targets_mean": 3401.8,
"valid_targets_min": 1101
},
{
"epoch": 3.6570812365204888,
"grad_norm": 0.8015662534418149,
"learning_rate": 2.1946079234097497e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13921813666820526,
"step": 2545,
"valid_targets_mean": 4335.4,
"valid_targets_min": 769
},
{
"epoch": 3.664270309130122,
"grad_norm": 0.529734503659625,
"learning_rate": 2.1874746527836738e-05,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11016402393579483,
"step": 2550,
"valid_targets_mean": 2528.5,
"valid_targets_min": 759
},
{
"epoch": 3.671459381739756,
"grad_norm": 0.6001197865922718,
"learning_rate": 2.180338975353422e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12066247314214706,
"step": 2555,
"valid_targets_mean": 2506.1,
"valid_targets_min": 542
},
{
"epoch": 3.678648454349389,
"grad_norm": 0.46689109296603837,
"learning_rate": 2.1732009827269947e-05,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11004269123077393,
"step": 2560,
"valid_targets_mean": 3788.0,
"valid_targets_min": 833
},
{
"epoch": 3.6858375269590224,
"grad_norm": 0.46412325094131973,
"learning_rate": 2.166060766542117e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13252490758895874,
"step": 2565,
"valid_targets_mean": 4282.9,
"valid_targets_min": 965
},
{
"epoch": 3.6930265995686558,
"grad_norm": 0.5207990273092182,
"learning_rate": 2.1589184184650573e-05,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0916057825088501,
"step": 2570,
"valid_targets_mean": 2747.2,
"valid_targets_min": 344
},
{
"epoch": 3.700215672178289,
"grad_norm": 0.5296101459863599,
"learning_rate": 2.1517740301894565e-05,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09578610211610794,
"step": 2575,
"valid_targets_mean": 2223.9,
"valid_targets_min": 421
},
{
"epoch": 3.7074047447879224,
"grad_norm": 0.5337544782692388,
"learning_rate": 2.144627693435145e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1551215648651123,
"step": 2580,
"valid_targets_mean": 3619.0,
"valid_targets_min": 630
},
{
"epoch": 3.7145938173975557,
"grad_norm": 0.46977810033457923,
"learning_rate": 2.1374794999469683e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11778691411018372,
"step": 2585,
"valid_targets_mean": 4017.2,
"valid_targets_min": 569
},
{
"epoch": 3.721782890007189,
"grad_norm": 0.5369932341533742,
"learning_rate": 2.1303295414936104e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18012884259223938,
"step": 2590,
"valid_targets_mean": 4391.9,
"valid_targets_min": 743
},
{
"epoch": 3.7289719626168223,
"grad_norm": 0.5299860172850779,
"learning_rate": 2.1231779098664117e-05,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13819974660873413,
"step": 2595,
"valid_targets_mean": 3378.9,
"valid_targets_min": 652
},
{
"epoch": 3.7361610352264556,
"grad_norm": 0.5258708261765481,
"learning_rate": 2.1160246968781946e-05,
"loss": 0.2663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1301390379667282,
"step": 2600,
"valid_targets_mean": 3329.5,
"valid_targets_min": 678
},
{
"epoch": 3.743350107836089,
"grad_norm": 0.4743676812927684,
"learning_rate": 2.1088699943620827e-05,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1157599464058876,
"step": 2605,
"valid_targets_mean": 3933.9,
"valid_targets_min": 621
},
{
"epoch": 3.7505391804457227,
"grad_norm": 0.5364161202382962,
"learning_rate": 2.1017138941703204e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12845493853092194,
"step": 2610,
"valid_targets_mean": 3678.6,
"valid_targets_min": 405
},
{
"epoch": 3.757728253055356,
"grad_norm": 0.46482943852345554,
"learning_rate": 2.094556488173098e-05,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1247505247592926,
"step": 2615,
"valid_targets_mean": 3829.6,
"valid_targets_min": 812
},
{
"epoch": 3.7649173256649893,
"grad_norm": 0.508770935066309,
"learning_rate": 2.0873978682573684e-05,
"loss": 0.2466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15090303122997284,
"step": 2620,
"valid_targets_mean": 4160.5,
"valid_targets_min": 686
},
{
"epoch": 3.7721063982746226,
"grad_norm": 0.493041194796532,
"learning_rate": 2.0802381263256695e-05,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14253270626068115,
"step": 2625,
"valid_targets_mean": 3882.0,
"valid_targets_min": 882
},
{
"epoch": 3.779295470884256,
"grad_norm": 0.4917977926190101,
"learning_rate": 2.0730773542949428e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1122705489397049,
"step": 2630,
"valid_targets_mean": 3226.6,
"valid_targets_min": 540
},
{
"epoch": 3.786484543493889,
"grad_norm": 0.4820507926987514,
"learning_rate": 2.0659156440953548e-05,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09798593819141388,
"step": 2635,
"valid_targets_mean": 2979.9,
"valid_targets_min": 700
},
{
"epoch": 3.7936736161035225,
"grad_norm": 0.5465128709652923,
"learning_rate": 2.058753087669117e-05,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12692230939865112,
"step": 2640,
"valid_targets_mean": 3353.5,
"valid_targets_min": 643
},
{
"epoch": 3.8008626887131562,
"grad_norm": 0.47851627989550993,
"learning_rate": 2.0515897769693015e-05,
"loss": 0.2472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14869645237922668,
"step": 2645,
"valid_targets_mean": 4664.6,
"valid_targets_min": 757
},
{
"epoch": 3.8080517613227896,
"grad_norm": 0.42380667956671314,
"learning_rate": 2.044425803958669e-05,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11933261156082153,
"step": 2650,
"valid_targets_mean": 4663.6,
"valid_targets_min": 3223
},
{
"epoch": 3.815240833932423,
"grad_norm": 0.4795587784552931,
"learning_rate": 2.0372612606084784e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1432308852672577,
"step": 2655,
"valid_targets_mean": 3894.0,
"valid_targets_min": 812
},
{
"epoch": 3.822429906542056,
"grad_norm": 0.5626384295877633,
"learning_rate": 2.030096238897314e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16091012954711914,
"step": 2660,
"valid_targets_mean": 3704.8,
"valid_targets_min": 533
},
{
"epoch": 3.8296189791516895,
"grad_norm": 0.8151561380660051,
"learning_rate": 2.022930830809898e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18149186670780182,
"step": 2665,
"valid_targets_mean": 4656.2,
"valid_targets_min": 821
},
{
"epoch": 3.836808051761323,
"grad_norm": 0.4453347518556729,
"learning_rate": 2.015765128335916e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12284523248672485,
"step": 2670,
"valid_targets_mean": 4547.9,
"valid_targets_min": 565
},
{
"epoch": 3.843997124370956,
"grad_norm": 0.43116833253695513,
"learning_rate": 2.0085992234688305e-05,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14145714044570923,
"step": 2675,
"valid_targets_mean": 4979.5,
"valid_targets_min": 3802
},
{
"epoch": 3.8511861969805894,
"grad_norm": 0.5595435853648367,
"learning_rate": 2.0014332082047043e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10264123976230621,
"step": 2680,
"valid_targets_mean": 2736.0,
"valid_targets_min": 690
},
{
"epoch": 3.8583752695902227,
"grad_norm": 0.48529338510837766,
"learning_rate": 1.994267174541015e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1485181450843811,
"step": 2685,
"valid_targets_mean": 3982.6,
"valid_targets_min": 579
},
{
"epoch": 3.865564342199856,
"grad_norm": 0.549946831719716,
"learning_rate": 1.9871012144754803e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11590389907360077,
"step": 2690,
"valid_targets_mean": 3149.9,
"valid_targets_min": 576
},
{
"epoch": 3.8727534148094893,
"grad_norm": 0.5228093621705135,
"learning_rate": 1.9799354200048687e-05,
"loss": 0.2486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08893737196922302,
"step": 2695,
"valid_targets_mean": 3057.0,
"valid_targets_min": 730
},
{
"epoch": 3.879942487419123,
"grad_norm": 0.530256928414435,
"learning_rate": 1.9727698831238265e-05,
"loss": 0.2595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14026793837547302,
"step": 2700,
"valid_targets_mean": 3831.9,
"valid_targets_min": 648
},
{
"epoch": 3.8871315600287564,
"grad_norm": 0.4793247139706527,
"learning_rate": 1.96560469582369e-05,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12756478786468506,
"step": 2705,
"valid_targets_mean": 4601.4,
"valid_targets_min": 666
},
{
"epoch": 3.8943206326383897,
"grad_norm": 0.5375220032845645,
"learning_rate": 1.9584399500913102e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13013246655464172,
"step": 2710,
"valid_targets_mean": 2996.8,
"valid_targets_min": 485
},
{
"epoch": 3.901509705248023,
"grad_norm": 0.5200980131239384,
"learning_rate": 1.9512757379078665e-05,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1247069388628006,
"step": 2715,
"valid_targets_mean": 3445.8,
"valid_targets_min": 618
},
{
"epoch": 3.9086987778576563,
"grad_norm": 0.4778551860033752,
"learning_rate": 1.9441121512476912e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1516200453042984,
"step": 2720,
"valid_targets_mean": 4454.6,
"valid_targets_min": 551
},
{
"epoch": 3.9158878504672896,
"grad_norm": 0.5198990277474976,
"learning_rate": 1.9369492820770846e-05,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12661394476890564,
"step": 2725,
"valid_targets_mean": 3578.6,
"valid_targets_min": 910
},
{
"epoch": 3.9230769230769234,
"grad_norm": 1.2379830764042923,
"learning_rate": 1.9297872223531358e-05,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10750366747379303,
"step": 2730,
"valid_targets_mean": 2653.1,
"valid_targets_min": 503
},
{
"epoch": 3.9302659956865567,
"grad_norm": 0.45535127246041973,
"learning_rate": 1.922626064022544e-05,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12956029176712036,
"step": 2735,
"valid_targets_mean": 5278.4,
"valid_targets_min": 998
},
{
"epoch": 3.93745506829619,
"grad_norm": 0.5503012132360744,
"learning_rate": 1.9154658990204338e-05,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14677077531814575,
"step": 2740,
"valid_targets_mean": 2994.5,
"valid_targets_min": 635
},
{
"epoch": 3.9446441409058233,
"grad_norm": 0.521779712095191,
"learning_rate": 1.9083068192691792e-05,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10208123177289963,
"step": 2745,
"valid_targets_mean": 2528.6,
"valid_targets_min": 767
},
{
"epoch": 3.9518332135154566,
"grad_norm": 0.5576470665601292,
"learning_rate": 1.9011489166772204e-05,
"loss": 0.2599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1775783747434616,
"step": 2750,
"valid_targets_mean": 4281.1,
"valid_targets_min": 656
},
{
"epoch": 3.95902228612509,
"grad_norm": 0.5764471708270146,
"learning_rate": 1.8939922831378865e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09720412641763687,
"step": 2755,
"valid_targets_mean": 2658.6,
"valid_targets_min": 721
},
{
"epoch": 3.966211358734723,
"grad_norm": 0.4811282846227278,
"learning_rate": 1.8868370105282135e-05,
"loss": 0.2533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10778206586837769,
"step": 2760,
"valid_targets_mean": 3013.0,
"valid_targets_min": 735
},
{
"epoch": 3.9734004313443565,
"grad_norm": 0.4976074155858476,
"learning_rate": 1.8796831907077664e-05,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1072898805141449,
"step": 2765,
"valid_targets_mean": 2946.6,
"valid_targets_min": 596
},
{
"epoch": 3.98058950395399,
"grad_norm": 0.46716125855521695,
"learning_rate": 1.8725309155174586e-05,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1110248863697052,
"step": 2770,
"valid_targets_mean": 3359.4,
"valid_targets_min": 876
},
{
"epoch": 3.987778576563623,
"grad_norm": 0.4514491824659271,
"learning_rate": 1.8653802767783745e-05,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11654454469680786,
"step": 2775,
"valid_targets_mean": 4018.5,
"valid_targets_min": 2968
},
{
"epoch": 3.9949676491732564,
"grad_norm": 0.5225982018438619,
"learning_rate": 1.858231366290588e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0763361006975174,
"step": 2780,
"valid_targets_mean": 2114.1,
"valid_targets_min": 756
},
{
"epoch": 4.0014378145219265,
"grad_norm": 0.45800317656753836,
"learning_rate": 1.851084275831987e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12621906399726868,
"step": 2785,
"valid_targets_mean": 3660.4,
"valid_targets_min": 715
},
{
"epoch": 4.00862688713156,
"grad_norm": 0.4664591476372027,
"learning_rate": 1.8439390971570945e-05,
"loss": 0.2395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13776497542858124,
"step": 2790,
"valid_targets_mean": 4713.0,
"valid_targets_min": 601
},
{
"epoch": 4.015815959741193,
"grad_norm": 0.4389595253807518,
"learning_rate": 1.836795921995889e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08556051552295685,
"step": 2795,
"valid_targets_mean": 4176.5,
"valid_targets_min": 3879
},
{
"epoch": 4.023005032350826,
"grad_norm": 0.5259882713055396,
"learning_rate": 1.829654842052627e-05,
"loss": 0.2338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10955113172531128,
"step": 2800,
"valid_targets_mean": 3373.2,
"valid_targets_min": 587
},
{
"epoch": 4.03019410496046,
"grad_norm": 0.4907017624215909,
"learning_rate": 1.8225159490046677e-05,
"loss": 0.229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09427815675735474,
"step": 2805,
"valid_targets_mean": 2864.4,
"valid_targets_min": 473
},
{
"epoch": 4.037383177570093,
"grad_norm": 0.5215374767845408,
"learning_rate": 1.8153793345012948e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15280203521251678,
"step": 2810,
"valid_targets_mean": 4268.6,
"valid_targets_min": 761
},
{
"epoch": 4.044572250179727,
"grad_norm": 0.5415288675373113,
"learning_rate": 1.8082450901625398e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1138095110654831,
"step": 2815,
"valid_targets_mean": 2448.5,
"valid_targets_min": 556
},
{
"epoch": 4.0517613227893605,
"grad_norm": 0.5781808878438677,
"learning_rate": 1.8011133075780055e-05,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13912703096866608,
"step": 2820,
"valid_targets_mean": 3542.9,
"valid_targets_min": 639
},
{
"epoch": 4.058950395398994,
"grad_norm": 0.5703158966366867,
"learning_rate": 1.7939840783056918e-05,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1219850406050682,
"step": 2825,
"valid_targets_mean": 3617.2,
"valid_targets_min": 597
},
{
"epoch": 4.066139468008627,
"grad_norm": 0.47744619786924974,
"learning_rate": 1.7868574938708173e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13453617691993713,
"step": 2830,
"valid_targets_mean": 4905.6,
"valid_targets_min": 4107
},
{
"epoch": 4.07332854061826,
"grad_norm": 0.5329830970965606,
"learning_rate": 1.779733645764649e-05,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14756852388381958,
"step": 2835,
"valid_targets_mean": 3957.4,
"valid_targets_min": 682
},
{
"epoch": 4.080517613227894,
"grad_norm": 0.5576027992717706,
"learning_rate": 1.772612625443321e-05,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1192103773355484,
"step": 2840,
"valid_targets_mean": 2559.9,
"valid_targets_min": 759
},
{
"epoch": 4.087706685837527,
"grad_norm": 0.5100156431566057,
"learning_rate": 1.7654945243266676e-05,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08618389070034027,
"step": 2845,
"valid_targets_mean": 3077.9,
"valid_targets_min": 568
},
{
"epoch": 4.09489575844716,
"grad_norm": 0.5340345118577982,
"learning_rate": 1.7583794337970452e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14345303177833557,
"step": 2850,
"valid_targets_mean": 4346.1,
"valid_targets_min": 1311
},
{
"epoch": 4.102084831056794,
"grad_norm": 0.4751066918549571,
"learning_rate": 1.751267445198159e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11668483912944794,
"step": 2855,
"valid_targets_mean": 4779.1,
"valid_targets_min": 3563
},
{
"epoch": 4.109273903666427,
"grad_norm": 0.5336703193480168,
"learning_rate": 1.7441586498338933e-05,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12484841048717499,
"step": 2860,
"valid_targets_mean": 3494.9,
"valid_targets_min": 640
},
{
"epoch": 4.11646297627606,
"grad_norm": 0.5501336623672213,
"learning_rate": 1.7370531389671362e-05,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14683029055595398,
"step": 2865,
"valid_targets_mean": 3951.5,
"valid_targets_min": 1163
},
{
"epoch": 4.123652048885694,
"grad_norm": 0.4575645222074036,
"learning_rate": 1.7299510038186105e-05,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12655046582221985,
"step": 2870,
"valid_targets_mean": 4511.2,
"valid_targets_min": 664
},
{
"epoch": 4.130841121495327,
"grad_norm": 0.4774593976400927,
"learning_rate": 1.7228523355657007e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09447678923606873,
"step": 2875,
"valid_targets_mean": 3125.4,
"valid_targets_min": 681
},
{
"epoch": 4.13803019410496,
"grad_norm": 0.5194608985400685,
"learning_rate": 1.7157572253412837e-05,
"loss": 0.2343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12980666756629944,
"step": 2880,
"valid_targets_mean": 3581.4,
"valid_targets_min": 742
},
{
"epoch": 4.1452192667145935,
"grad_norm": 0.509774077422665,
"learning_rate": 1.7086657642325568e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13197895884513855,
"step": 2885,
"valid_targets_mean": 4029.1,
"valid_targets_min": 861
},
{
"epoch": 4.152408339324227,
"grad_norm": 0.5297749408912853,
"learning_rate": 1.7015780432798727e-05,
"loss": 0.2416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09195668995380402,
"step": 2890,
"valid_targets_mean": 2926.8,
"valid_targets_min": 664
},
{
"epoch": 4.15959741193386,
"grad_norm": 0.5090609267845478,
"learning_rate": 1.694494153475565e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09950702637434006,
"step": 2895,
"valid_targets_mean": 3153.4,
"valid_targets_min": 257
},
{
"epoch": 4.166786484543494,
"grad_norm": 0.5818668202631337,
"learning_rate": 1.6874141857627846e-05,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1345033049583435,
"step": 2900,
"valid_targets_mean": 3743.4,
"valid_targets_min": 651
},
{
"epoch": 4.173975557153128,
"grad_norm": 0.5817354875875417,
"learning_rate": 1.6803382310343307e-05,
"loss": 0.2395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12657590210437775,
"step": 2905,
"valid_targets_mean": 2877.4,
"valid_targets_min": 537
},
{
"epoch": 4.181164629762761,
"grad_norm": 0.5317207649090678,
"learning_rate": 1.6732663801314827e-05,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10397838056087494,
"step": 2910,
"valid_targets_mean": 2906.8,
"valid_targets_min": 683
},
{
"epoch": 4.188353702372394,
"grad_norm": 0.535580648009678,
"learning_rate": 1.6661987238428355e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1221417486667633,
"step": 2915,
"valid_targets_mean": 3189.6,
"valid_targets_min": 670
},
{
"epoch": 4.1955427749820275,
"grad_norm": 0.5363296910044444,
"learning_rate": 1.6591353529031334e-05,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11720272898674011,
"step": 2920,
"valid_targets_mean": 3409.9,
"valid_targets_min": 647
},
{
"epoch": 4.202731847591661,
"grad_norm": 0.5406261463557596,
"learning_rate": 1.6520763579921048e-05,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11183007061481476,
"step": 2925,
"valid_targets_mean": 3812.8,
"valid_targets_min": 518
},
{
"epoch": 4.209920920201294,
"grad_norm": 0.48867123793633094,
"learning_rate": 1.6450218297333e-05,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09008172154426575,
"step": 2930,
"valid_targets_mean": 2935.0,
"valid_targets_min": 621
},
{
"epoch": 4.2171099928109275,
"grad_norm": 0.5048761048747257,
"learning_rate": 1.6379718586929235e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13712650537490845,
"step": 2935,
"valid_targets_mean": 4341.1,
"valid_targets_min": 564
},
{
"epoch": 4.224299065420561,
"grad_norm": 0.4903661529952285,
"learning_rate": 1.6309265353786777e-05,
"loss": 0.2429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12769557535648346,
"step": 2940,
"valid_targets_mean": 4333.5,
"valid_targets_min": 548
},
{
"epoch": 4.231488138030194,
"grad_norm": 0.5150498165284755,
"learning_rate": 1.6238859502385943e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07896912097930908,
"step": 2945,
"valid_targets_mean": 2458.0,
"valid_targets_min": 230
},
{
"epoch": 4.238677210639827,
"grad_norm": 0.5953862527405311,
"learning_rate": 1.6168501936598783e-05,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12767180800437927,
"step": 2950,
"valid_targets_mean": 3435.4,
"valid_targets_min": 711
},
{
"epoch": 4.245866283249461,
"grad_norm": 0.5210564257953418,
"learning_rate": 1.609819355967744e-05,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1351774036884308,
"step": 2955,
"valid_targets_mean": 4328.6,
"valid_targets_min": 582
},
{
"epoch": 4.253055355859094,
"grad_norm": 0.5229807638300585,
"learning_rate": 1.6027935274242575e-05,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09753084182739258,
"step": 2960,
"valid_targets_mean": 2665.4,
"valid_targets_min": 528
},
{
"epoch": 4.260244428468727,
"grad_norm": 0.4864103710763143,
"learning_rate": 1.5957727982271788e-05,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10253024846315384,
"step": 2965,
"valid_targets_mean": 3451.0,
"valid_targets_min": 720
},
{
"epoch": 4.267433501078361,
"grad_norm": 0.5549949272831466,
"learning_rate": 1.5887572585087995e-05,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08487284183502197,
"step": 2970,
"valid_targets_mean": 2780.6,
"valid_targets_min": 542
},
{
"epoch": 4.274622573687994,
"grad_norm": 0.45558638561523057,
"learning_rate": 1.5817469983347912e-05,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12247081845998764,
"step": 2975,
"valid_targets_mean": 4601.6,
"valid_targets_min": 1034
},
{
"epoch": 4.281811646297627,
"grad_norm": 0.5024007698937418,
"learning_rate": 1.5747421077030442e-05,
"loss": 0.2412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10787507891654968,
"step": 2980,
"valid_targets_mean": 3700.0,
"valid_targets_min": 606
},
{
"epoch": 4.2890007189072605,
"grad_norm": 0.5082106914176634,
"learning_rate": 1.5677426765425166e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11795713007450104,
"step": 2985,
"valid_targets_mean": 3604.4,
"valid_targets_min": 731
},
{
"epoch": 4.296189791516895,
"grad_norm": 0.4499094022949875,
"learning_rate": 1.5607487947120766e-05,
"loss": 0.2334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1429499387741089,
"step": 2990,
"valid_targets_mean": 5784.1,
"valid_targets_min": 3691
},
{
"epoch": 4.303378864126528,
"grad_norm": 0.43554600462791326,
"learning_rate": 1.55376055199935e-05,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13606850802898407,
"step": 2995,
"valid_targets_mean": 5484.5,
"valid_targets_min": 4161
},
{
"epoch": 4.310567936736161,
"grad_norm": 0.48479942765593714,
"learning_rate": 1.5467780381195675e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09615229070186615,
"step": 3000,
"valid_targets_mean": 3328.8,
"valid_targets_min": 546
},
{
"epoch": 4.317757009345795,
"grad_norm": 0.5483839501262737,
"learning_rate": 1.5398013427144136e-05,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13533805310726166,
"step": 3005,
"valid_targets_mean": 3739.2,
"valid_targets_min": 528
},
{
"epoch": 4.324946081955428,
"grad_norm": 0.5325384384939251,
"learning_rate": 1.5328305553508737e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10858841985464096,
"step": 3010,
"valid_targets_mean": 3556.6,
"valid_targets_min": 867
},
{
"epoch": 4.332135154565061,
"grad_norm": 0.488394898199471,
"learning_rate": 1.5258657655200862e-05,
"loss": 0.244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11653181165456772,
"step": 3015,
"valid_targets_mean": 3955.2,
"valid_targets_min": 557
},
{
"epoch": 4.339324227174695,
"grad_norm": 0.5105599359428391,
"learning_rate": 1.5189070626361941e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12870097160339355,
"step": 3020,
"valid_targets_mean": 4240.0,
"valid_targets_min": 702
},
{
"epoch": 4.346513299784328,
"grad_norm": 0.5715965859853566,
"learning_rate": 1.5119545360351957e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15724487602710724,
"step": 3025,
"valid_targets_mean": 3764.2,
"valid_targets_min": 566
},
{
"epoch": 4.353702372393961,
"grad_norm": 0.5896736194868126,
"learning_rate": 1.505008274973796e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13168630003929138,
"step": 3030,
"valid_targets_mean": 3176.2,
"valid_targets_min": 633
},
{
"epoch": 4.3608914450035945,
"grad_norm": 0.5156466323454092,
"learning_rate": 1.4980683686282657e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12574413418769836,
"step": 3035,
"valid_targets_mean": 3254.2,
"valid_targets_min": 645
},
{
"epoch": 4.368080517613228,
"grad_norm": 0.47988451535887794,
"learning_rate": 1.4911349060932909e-05,
"loss": 0.2285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11421344429254532,
"step": 3040,
"valid_targets_mean": 4213.0,
"valid_targets_min": 732
},
{
"epoch": 4.375269590222861,
"grad_norm": 0.5042870458706878,
"learning_rate": 1.484207976380834e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1530284583568573,
"step": 3045,
"valid_targets_mean": 4835.0,
"valid_targets_min": 918
},
{
"epoch": 4.382458662832494,
"grad_norm": 0.536704227286159,
"learning_rate": 1.4772876684189879e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13965827226638794,
"step": 3050,
"valid_targets_mean": 3876.8,
"valid_targets_min": 423
},
{
"epoch": 4.389647735442128,
"grad_norm": 0.46602382013395727,
"learning_rate": 1.4703740710508352e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12959733605384827,
"step": 3055,
"valid_targets_mean": 5016.6,
"valid_targets_min": 4090
},
{
"epoch": 4.396836808051761,
"grad_norm": 0.5514211790349896,
"learning_rate": 1.4634672730333079e-05,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.125798761844635,
"step": 3060,
"valid_targets_mean": 3335.4,
"valid_targets_min": 727
},
{
"epoch": 4.404025880661394,
"grad_norm": 0.5827049576069567,
"learning_rate": 1.4565673630360482e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09962286055088043,
"step": 3065,
"valid_targets_mean": 2581.2,
"valid_targets_min": 580
},
{
"epoch": 4.411214953271028,
"grad_norm": 0.47939759496807005,
"learning_rate": 1.4496744296402686e-05,
"loss": 0.2365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0976216048002243,
"step": 3070,
"valid_targets_mean": 3415.2,
"valid_targets_min": 691
},
{
"epoch": 4.418404025880662,
"grad_norm": 0.502919510044186,
"learning_rate": 1.4427885613376176e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10967571288347244,
"step": 3075,
"valid_targets_mean": 3390.2,
"valid_targets_min": 559
},
{
"epoch": 4.425593098490295,
"grad_norm": 0.6305898129788904,
"learning_rate": 1.4359098465290401e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10862769186496735,
"step": 3080,
"valid_targets_mean": 2415.8,
"valid_targets_min": 786
},
{
"epoch": 4.4327821710999284,
"grad_norm": 0.5575222975267811,
"learning_rate": 1.4290383735236453e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10775524377822876,
"step": 3085,
"valid_targets_mean": 3085.9,
"valid_targets_min": 611
},
{
"epoch": 4.439971243709562,
"grad_norm": 0.49802953687828977,
"learning_rate": 1.4221742305375716e-05,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0978183001279831,
"step": 3090,
"valid_targets_mean": 2689.6,
"valid_targets_min": 538
},
{
"epoch": 4.447160316319195,
"grad_norm": 0.5756490270686243,
"learning_rate": 1.4153175056928543e-05,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09058581292629242,
"step": 3095,
"valid_targets_mean": 2022.0,
"valid_targets_min": 522
},
{
"epoch": 4.454349388928828,
"grad_norm": 0.5208077664252705,
"learning_rate": 1.408468287016295e-05,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12745115160942078,
"step": 3100,
"valid_targets_mean": 3539.4,
"valid_targets_min": 602
},
{
"epoch": 4.461538461538462,
"grad_norm": 0.4377191730808559,
"learning_rate": 1.4016266624383299e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11340028047561646,
"step": 3105,
"valid_targets_mean": 4446.4,
"valid_targets_min": 680
},
{
"epoch": 4.468727534148095,
"grad_norm": 0.7054657373358831,
"learning_rate": 1.3947927197919038e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14070342481136322,
"step": 3110,
"valid_targets_mean": 2662.5,
"valid_targets_min": 507
},
{
"epoch": 4.475916606757728,
"grad_norm": 0.518522447767955,
"learning_rate": 1.387966546811338e-05,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14628420770168304,
"step": 3115,
"valid_targets_mean": 4294.0,
"valid_targets_min": 675
},
{
"epoch": 4.483105679367362,
"grad_norm": 0.45175962309797224,
"learning_rate": 1.3811482311312092e-05,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1265779733657837,
"step": 3120,
"valid_targets_mean": 4493.6,
"valid_targets_min": 3468
},
{
"epoch": 4.490294751976995,
"grad_norm": 0.5802694137312429,
"learning_rate": 1.3743378602852201e-05,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10025407373905182,
"step": 3125,
"valid_targets_mean": 2324.8,
"valid_targets_min": 722
},
{
"epoch": 4.497483824586628,
"grad_norm": 0.5255053806019105,
"learning_rate": 1.3675355217050781e-05,
"loss": 0.2338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1405080258846283,
"step": 3130,
"valid_targets_mean": 4538.6,
"valid_targets_min": 814
},
{
"epoch": 4.5046728971962615,
"grad_norm": 0.5595718040895143,
"learning_rate": 1.360741302719373e-05,
"loss": 0.2333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13758280873298645,
"step": 3135,
"valid_targets_mean": 3494.5,
"valid_targets_min": 627
},
{
"epoch": 4.511861969805895,
"grad_norm": 0.49673632869856904,
"learning_rate": 1.3539552905524542e-05,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12679347395896912,
"step": 3140,
"valid_targets_mean": 4069.8,
"valid_targets_min": 455
},
{
"epoch": 4.519051042415528,
"grad_norm": 0.4796342803182259,
"learning_rate": 1.347177572323311e-05,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11640562862157822,
"step": 3145,
"valid_targets_mean": 3925.0,
"valid_targets_min": 954
},
{
"epoch": 4.526240115025161,
"grad_norm": 0.49543130568416427,
"learning_rate": 1.340408235044457e-05,
"loss": 0.2416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1236979067325592,
"step": 3150,
"valid_targets_mean": 3800.5,
"valid_targets_min": 791
},
{
"epoch": 4.533429187634795,
"grad_norm": 0.45765247970692274,
"learning_rate": 1.3336473656208084e-05,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12283189594745636,
"step": 3155,
"valid_targets_mean": 4273.1,
"valid_targets_min": 877
},
{
"epoch": 4.540618260244429,
"grad_norm": 0.5129923770235678,
"learning_rate": 1.326895050848573e-05,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13487502932548523,
"step": 3160,
"valid_targets_mean": 4268.9,
"valid_targets_min": 3321
},
{
"epoch": 4.547807332854061,
"grad_norm": 0.44141191686175985,
"learning_rate": 1.3201513774141321e-05,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12209541350603104,
"step": 3165,
"valid_targets_mean": 4852.6,
"valid_targets_min": 1859
},
{
"epoch": 4.5549964054636956,
"grad_norm": 0.4942636534490483,
"learning_rate": 1.3134164318929314e-05,
"loss": 0.2361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09581250697374344,
"step": 3170,
"valid_targets_mean": 3307.5,
"valid_targets_min": 689
},
{
"epoch": 4.562185478073329,
"grad_norm": 0.47384730378168516,
"learning_rate": 1.306690300748365e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13601398468017578,
"step": 3175,
"valid_targets_mean": 4708.5,
"valid_targets_min": 3342
},
{
"epoch": 4.569374550682962,
"grad_norm": 0.5943206386606482,
"learning_rate": 1.2999730703306697e-05,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12636137008666992,
"step": 3180,
"valid_targets_mean": 3298.8,
"valid_targets_min": 552
},
{
"epoch": 4.5765636232925955,
"grad_norm": 0.5239127580206798,
"learning_rate": 1.2932648268758132e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16251717507839203,
"step": 3185,
"valid_targets_mean": 5176.2,
"valid_targets_min": 859
},
{
"epoch": 4.583752695902229,
"grad_norm": 0.4661488811609455,
"learning_rate": 1.2865656565043896e-05,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11450262367725372,
"step": 3190,
"valid_targets_mean": 4073.1,
"valid_targets_min": 1440
},
{
"epoch": 4.590941768511862,
"grad_norm": 0.509066791632617,
"learning_rate": 1.2798756452205119e-05,
"loss": 0.2517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.104307621717453,
"step": 3195,
"valid_targets_mean": 3497.1,
"valid_targets_min": 651
},
{
"epoch": 4.598130841121495,
"grad_norm": 0.4906266924266068,
"learning_rate": 1.273194878910708e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1050233393907547,
"step": 3200,
"valid_targets_mean": 3821.8,
"valid_targets_min": 987
},
{
"epoch": 4.605319913731129,
"grad_norm": 0.5811645770283341,
"learning_rate": 1.2665234433428197e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10122254490852356,
"step": 3205,
"valid_targets_mean": 2902.4,
"valid_targets_min": 620
},
{
"epoch": 4.612508986340762,
"grad_norm": 0.4816881331945686,
"learning_rate": 1.2598614241648996e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12213660031557083,
"step": 3210,
"valid_targets_mean": 3917.1,
"valid_targets_min": 821
},
{
"epoch": 4.619698058950395,
"grad_norm": 0.610812993328097,
"learning_rate": 1.2532089069041132e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1288452297449112,
"step": 3215,
"valid_targets_mean": 3823.6,
"valid_targets_min": 794
},
{
"epoch": 4.626887131560029,
"grad_norm": 0.44024322286663997,
"learning_rate": 1.246565976965639e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1286042183637619,
"step": 3220,
"valid_targets_mean": 5272.4,
"valid_targets_min": 4339
},
{
"epoch": 4.634076204169662,
"grad_norm": 0.5473777106333456,
"learning_rate": 1.2399327196315751e-05,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18179279565811157,
"step": 3225,
"valid_targets_mean": 4101.0,
"valid_targets_min": 700
},
{
"epoch": 4.641265276779295,
"grad_norm": 0.4742924751198838,
"learning_rate": 1.2333092200598402e-05,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11457015573978424,
"step": 3230,
"valid_targets_mean": 4462.1,
"valid_targets_min": 748
},
{
"epoch": 4.6484543493889285,
"grad_norm": 0.48078713086524894,
"learning_rate": 1.2266955632830846e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1189941018819809,
"step": 3235,
"valid_targets_mean": 3519.9,
"valid_targets_min": 620
},
{
"epoch": 4.655643421998562,
"grad_norm": 0.5044909830237237,
"learning_rate": 1.220091834207595e-05,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13733816146850586,
"step": 3240,
"valid_targets_mean": 4848.1,
"valid_targets_min": 885
},
{
"epoch": 4.662832494608195,
"grad_norm": 0.6257029056964695,
"learning_rate": 1.2134981176122068e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12326426804065704,
"step": 3245,
"valid_targets_mean": 2731.6,
"valid_targets_min": 521
},
{
"epoch": 4.6700215672178285,
"grad_norm": 0.49878248364441824,
"learning_rate": 1.2069144981472151e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11302924901247025,
"step": 3250,
"valid_targets_mean": 3593.5,
"valid_targets_min": 584
},
{
"epoch": 4.677210639827463,
"grad_norm": 0.5530561603271289,
"learning_rate": 1.2003410603332886e-05,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09142284095287323,
"step": 3255,
"valid_targets_mean": 2795.4,
"valid_targets_min": 644
},
{
"epoch": 4.684399712437096,
"grad_norm": 0.4944302859327403,
"learning_rate": 1.1937778885603808e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12129175662994385,
"step": 3260,
"valid_targets_mean": 3967.4,
"valid_targets_min": 817
},
{
"epoch": 4.691588785046729,
"grad_norm": 0.4862312666118715,
"learning_rate": 1.187225067086653e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10455331951379776,
"step": 3265,
"valid_targets_mean": 3429.9,
"valid_targets_min": 602
},
{
"epoch": 4.698777857656363,
"grad_norm": 0.4994833360624931,
"learning_rate": 1.1806826800373863e-05,
"loss": 0.2316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12258949130773544,
"step": 3270,
"valid_targets_mean": 3713.8,
"valid_targets_min": 774
},
{
"epoch": 4.705966930265996,
"grad_norm": 0.49940999662894353,
"learning_rate": 1.1741508114039064e-05,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12433376908302307,
"step": 3275,
"valid_targets_mean": 4469.5,
"valid_targets_min": 583
},
{
"epoch": 4.713156002875629,
"grad_norm": 0.5623276876572705,
"learning_rate": 1.1676295450425026e-05,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1007264107465744,
"step": 3280,
"valid_targets_mean": 2477.0,
"valid_targets_min": 727
},
{
"epoch": 4.7203450754852625,
"grad_norm": 0.555739824339317,
"learning_rate": 1.1611189646733502e-05,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12210990488529205,
"step": 3285,
"valid_targets_mean": 3138.5,
"valid_targets_min": 651
},
{
"epoch": 4.727534148094896,
"grad_norm": 0.4994433206664333,
"learning_rate": 1.1546191538794417e-05,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0810234323143959,
"step": 3290,
"valid_targets_mean": 3035.2,
"valid_targets_min": 555
},
{
"epoch": 4.734723220704529,
"grad_norm": 0.4854393794231303,
"learning_rate": 1.1481301961055058e-05,
"loss": 0.2403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10804124176502228,
"step": 3295,
"valid_targets_mean": 3984.9,
"valid_targets_min": 411
},
{
"epoch": 4.741912293314162,
"grad_norm": 0.5717087891184073,
"learning_rate": 1.14165217465694e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11047998070716858,
"step": 3300,
"valid_targets_mean": 2894.4,
"valid_targets_min": 761
},
{
"epoch": 4.749101365923796,
"grad_norm": 0.5418658879133041,
"learning_rate": 1.1351851726987441e-05,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14435940980911255,
"step": 3305,
"valid_targets_mean": 3214.9,
"valid_targets_min": 604
},
{
"epoch": 4.756290438533429,
"grad_norm": 0.44613577875582505,
"learning_rate": 1.1287292732544462e-05,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11927706003189087,
"step": 3310,
"valid_targets_mean": 3904.1,
"valid_targets_min": 708
},
{
"epoch": 4.763479511143062,
"grad_norm": 0.49545137174974385,
"learning_rate": 1.1222845592050416e-05,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1117856502532959,
"step": 3315,
"valid_targets_mean": 4137.6,
"valid_targets_min": 926
},
{
"epoch": 4.770668583752696,
"grad_norm": 0.44613604063424483,
"learning_rate": 1.1158511132879254e-05,
"loss": 0.2341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08571384847164154,
"step": 3320,
"valid_targets_mean": 3550.2,
"valid_targets_min": 524
},
{
"epoch": 4.777857656362329,
"grad_norm": 0.5561329176868874,
"learning_rate": 1.109429018095836e-05,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.174579918384552,
"step": 3325,
"valid_targets_mean": 3782.0,
"valid_targets_min": 632
},
{
"epoch": 4.785046728971962,
"grad_norm": 0.5036404755895384,
"learning_rate": 1.1030183560757873e-05,
"loss": 0.2264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10416017472743988,
"step": 3330,
"valid_targets_mean": 3204.6,
"valid_targets_min": 801
},
{
"epoch": 4.792235801581596,
"grad_norm": 0.5301785485503443,
"learning_rate": 1.0966192095280148e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1077873557806015,
"step": 3335,
"valid_targets_mean": 3394.2,
"valid_targets_min": 493
},
{
"epoch": 4.79942487419123,
"grad_norm": 0.5472468768495766,
"learning_rate": 1.090231660604918e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10582281649112701,
"step": 3340,
"valid_targets_mean": 2981.2,
"valid_targets_min": 715
},
{
"epoch": 4.806613946800863,
"grad_norm": 0.5841063617132195,
"learning_rate": 1.0838557913100074e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08225120604038239,
"step": 3345,
"valid_targets_mean": 2107.0,
"valid_targets_min": 456
},
{
"epoch": 4.813803019410496,
"grad_norm": 0.5072600809639856,
"learning_rate": 1.0774916834968484e-05,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10606703162193298,
"step": 3350,
"valid_targets_mean": 3230.5,
"valid_targets_min": 655
},
{
"epoch": 4.82099209202013,
"grad_norm": 0.5454695842764663,
"learning_rate": 1.0711394188680117e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09919101744890213,
"step": 3355,
"valid_targets_mean": 2742.1,
"valid_targets_min": 614
},
{
"epoch": 4.828181164629763,
"grad_norm": 0.577090532210789,
"learning_rate": 1.0647990789740269e-05,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14345696568489075,
"step": 3360,
"valid_targets_mean": 3700.5,
"valid_targets_min": 614
},
{
"epoch": 4.835370237239396,
"grad_norm": 0.599439746241527,
"learning_rate": 1.058470745212333e-05,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1152365431189537,
"step": 3365,
"valid_targets_mean": 3038.6,
"valid_targets_min": 637
},
{
"epoch": 4.84255930984903,
"grad_norm": 0.4796989899141097,
"learning_rate": 1.0521544988262335e-05,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08579153567552567,
"step": 3370,
"valid_targets_mean": 3213.6,
"valid_targets_min": 609
},
{
"epoch": 4.849748382458663,
"grad_norm": 0.6490810772399019,
"learning_rate": 1.0458504209038533e-05,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14216336607933044,
"step": 3375,
"valid_targets_mean": 2942.9,
"valid_targets_min": 557
},
{
"epoch": 4.856937455068296,
"grad_norm": 0.4870269459652767,
"learning_rate": 1.0395585923770981e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09269210696220398,
"step": 3380,
"valid_targets_mean": 3761.9,
"valid_targets_min": 629
},
{
"epoch": 4.8641265276779295,
"grad_norm": 0.46747238467905033,
"learning_rate": 1.0332790940206183e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1230100691318512,
"step": 3385,
"valid_targets_mean": 4636.8,
"valid_targets_min": 2480
},
{
"epoch": 4.871315600287563,
"grad_norm": 0.6495857497948903,
"learning_rate": 1.0270120064507664e-05,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1402766853570938,
"step": 3390,
"valid_targets_mean": 4321.4,
"valid_targets_min": 1066
},
{
"epoch": 4.878504672897196,
"grad_norm": 0.47843085114562955,
"learning_rate": 1.0207574101245661e-05,
"loss": 0.2317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09787297248840332,
"step": 3395,
"valid_targets_mean": 3257.5,
"valid_targets_min": 860
},
{
"epoch": 4.885693745506829,
"grad_norm": 0.4826999323999703,
"learning_rate": 1.0145153853386764e-05,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08830671012401581,
"step": 3400,
"valid_targets_mean": 2271.1,
"valid_targets_min": 582
},
{
"epoch": 4.892882818116463,
"grad_norm": 0.4933668590281263,
"learning_rate": 1.0082860122283667e-05,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14057773351669312,
"step": 3405,
"valid_targets_mean": 4368.4,
"valid_targets_min": 775
},
{
"epoch": 4.900071890726096,
"grad_norm": 0.5820889582759022,
"learning_rate": 1.0020693707664799e-05,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11664923280477524,
"step": 3410,
"valid_targets_mean": 3539.9,
"valid_targets_min": 670
},
{
"epoch": 4.907260963335729,
"grad_norm": 0.48946946217080056,
"learning_rate": 9.958655407624103e-06,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09979799389839172,
"step": 3415,
"valid_targets_mean": 3043.6,
"valid_targets_min": 688
},
{
"epoch": 4.914450035945363,
"grad_norm": 0.5073233040403398,
"learning_rate": 9.89674601861081e-06,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11947494745254517,
"step": 3420,
"valid_targets_mean": 4196.5,
"valid_targets_min": 1035
},
{
"epoch": 4.921639108554997,
"grad_norm": 0.7177282984792761,
"learning_rate": 9.83496633541916e-06,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12936556339263916,
"step": 3425,
"valid_targets_mean": 3776.4,
"valid_targets_min": 842
},
{
"epoch": 4.928828181164629,
"grad_norm": 0.5118285957400573,
"learning_rate": 9.773317151178239e-06,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13362133502960205,
"step": 3430,
"valid_targets_mean": 4502.4,
"valid_targets_min": 779
},
{
"epoch": 4.9360172537742635,
"grad_norm": 0.5443810213820736,
"learning_rate": 9.711799257341772e-06,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10535494983196259,
"step": 3435,
"valid_targets_mean": 3771.1,
"valid_targets_min": 673
},
{
"epoch": 4.943206326383897,
"grad_norm": 0.5591247338648125,
"learning_rate": 9.650413443678e-06,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13685429096221924,
"step": 3440,
"valid_targets_mean": 3843.8,
"valid_targets_min": 979
},
{
"epoch": 4.95039539899353,
"grad_norm": 0.4678569233701499,
"learning_rate": 9.58916049825949e-06,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1224527508020401,
"step": 3445,
"valid_targets_mean": 4677.8,
"valid_targets_min": 3661
},
{
"epoch": 4.957584471603163,
"grad_norm": 0.5440934246700909,
"learning_rate": 9.528041207453056e-06,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15713685750961304,
"step": 3450,
"valid_targets_mean": 5048.0,
"valid_targets_min": 965
},
{
"epoch": 4.964773544212797,
"grad_norm": 0.49743408684165086,
"learning_rate": 9.467056355909639e-06,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08757054060697556,
"step": 3455,
"valid_targets_mean": 3058.4,
"valid_targets_min": 412
},
{
"epoch": 4.97196261682243,
"grad_norm": 0.48083670685811697,
"learning_rate": 9.40620672655427e-06,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10417330265045166,
"step": 3460,
"valid_targets_mean": 3597.5,
"valid_targets_min": 682
},
{
"epoch": 4.979151689432063,
"grad_norm": 0.5179283083362081,
"learning_rate": 9.34549310057597e-06,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11766026169061661,
"step": 3465,
"valid_targets_mean": 3463.0,
"valid_targets_min": 675
},
{
"epoch": 4.986340762041697,
"grad_norm": 0.4837812594204367,
"learning_rate": 9.284916257417746e-06,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18496853113174438,
"step": 3470,
"valid_targets_mean": 5729.2,
"valid_targets_min": 950
},
{
"epoch": 4.99352983465133,
"grad_norm": 0.4904953793566584,
"learning_rate": 9.2244769747666e-06,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.135883167386055,
"step": 3475,
"valid_targets_mean": 4532.1,
"valid_targets_min": 761
},
{
"epoch": 5.0,
"grad_norm": 0.7004899366166182,
"learning_rate": 9.16417602854353e-06,
"loss": 0.2355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21526622772216797,
"step": 3480,
"valid_targets_mean": 3061.6,
"valid_targets_min": 677
},
{
"epoch": 5.007189072609633,
"grad_norm": 0.5375983632773035,
"learning_rate": 9.104014192893547e-06,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13673044741153717,
"step": 3485,
"valid_targets_mean": 3982.0,
"valid_targets_min": 862
},
{
"epoch": 5.014378145219267,
"grad_norm": 0.5074525307969784,
"learning_rate": 9.04399224017577e-06,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08781856298446655,
"step": 3490,
"valid_targets_mean": 2563.9,
"valid_targets_min": 565
},
{
"epoch": 5.0215672178289,
"grad_norm": 0.5226625346422593,
"learning_rate": 8.984110940953485e-06,
"loss": 0.2242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11326141655445099,
"step": 3495,
"valid_targets_mean": 4074.4,
"valid_targets_min": 662
},
{
"epoch": 5.028756290438533,
"grad_norm": 0.5085797015984954,
"learning_rate": 8.924371063984294e-06,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11057010293006897,
"step": 3500,
"valid_targets_mean": 4120.9,
"valid_targets_min": 455
},
{
"epoch": 5.0359453630481665,
"grad_norm": 0.4769148575385776,
"learning_rate": 8.86477337621019e-06,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12291170656681061,
"step": 3505,
"valid_targets_mean": 4678.4,
"valid_targets_min": 3405
},
{
"epoch": 5.0431344356578,
"grad_norm": 0.5564512722540663,
"learning_rate": 8.805318642747746e-06,
"loss": 0.2339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11856968700885773,
"step": 3510,
"valid_targets_mean": 3500.5,
"valid_targets_min": 624
},
{
"epoch": 5.050323508267433,
"grad_norm": 0.5566437898397325,
"learning_rate": 8.746007626878274e-06,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10583490133285522,
"step": 3515,
"valid_targets_mean": 3376.5,
"valid_targets_min": 747
},
{
"epoch": 5.0575125808770665,
"grad_norm": 0.6086364544635542,
"learning_rate": 8.686841090038066e-06,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12775224447250366,
"step": 3520,
"valid_targets_mean": 3280.1,
"valid_targets_min": 551
},
{
"epoch": 5.064701653486701,
"grad_norm": 0.5185408192200104,
"learning_rate": 8.627819791808557e-06,
"loss": 0.2315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1279093325138092,
"step": 3525,
"valid_targets_mean": 4133.9,
"valid_targets_min": 487
},
{
"epoch": 5.071890726096334,
"grad_norm": 0.5301333550786779,
"learning_rate": 8.568944489906608e-06,
"loss": 0.2409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13012029230594635,
"step": 3530,
"valid_targets_mean": 4145.6,
"valid_targets_min": 893
},
{
"epoch": 5.079079798705967,
"grad_norm": 0.5183690582049101,
"learning_rate": 8.510215940174802e-06,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13085518777370453,
"step": 3535,
"valid_targets_mean": 5321.9,
"valid_targets_min": 597
},
{
"epoch": 5.086268871315601,
"grad_norm": 0.4579516502915308,
"learning_rate": 8.45163489657169e-06,
"loss": 0.2168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11568126827478409,
"step": 3540,
"valid_targets_mean": 3944.9,
"valid_targets_min": 731
},
{
"epoch": 5.093457943925234,
"grad_norm": 0.5507002546950306,
"learning_rate": 8.393202111162139e-06,
"loss": 0.2257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09243332594633102,
"step": 3545,
"valid_targets_mean": 3075.0,
"valid_targets_min": 591
},
{
"epoch": 5.100647016534867,
"grad_norm": 0.5383009778697873,
"learning_rate": 8.334918334107673e-06,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1040419340133667,
"step": 3550,
"valid_targets_mean": 3633.8,
"valid_targets_min": 711
},
{
"epoch": 5.1078360891445005,
"grad_norm": 0.5757360955048402,
"learning_rate": 8.276784313656857e-06,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11551609635353088,
"step": 3555,
"valid_targets_mean": 3326.9,
"valid_targets_min": 601
},
{
"epoch": 5.115025161754134,
"grad_norm": 0.5291511551810913,
"learning_rate": 8.218800796135666e-06,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1199103370308876,
"step": 3560,
"valid_targets_mean": 3476.9,
"valid_targets_min": 635
},
{
"epoch": 5.122214234363767,
"grad_norm": 0.5415093823430597,
"learning_rate": 8.16096852593791e-06,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1012372300028801,
"step": 3565,
"valid_targets_mean": 3252.1,
"valid_targets_min": 616
},
{
"epoch": 5.1294033069734,
"grad_norm": 0.5573860753092026,
"learning_rate": 8.103288245515681e-06,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1514764130115509,
"step": 3570,
"valid_targets_mean": 5006.4,
"valid_targets_min": 879
},
{
"epoch": 5.136592379583034,
"grad_norm": 0.5223848215183271,
"learning_rate": 8.045760695369847e-06,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12808704376220703,
"step": 3575,
"valid_targets_mean": 4967.6,
"valid_targets_min": 471
},
{
"epoch": 5.143781452192667,
"grad_norm": 0.5143444928109423,
"learning_rate": 7.988386614040494e-06,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1381615698337555,
"step": 3580,
"valid_targets_mean": 4538.1,
"valid_targets_min": 849
},
{
"epoch": 5.1509705248023,
"grad_norm": 0.5182514437257415,
"learning_rate": 7.931166738097475e-06,
"loss": 0.2274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09853020310401917,
"step": 3585,
"valid_targets_mean": 2926.4,
"valid_targets_min": 568
},
{
"epoch": 5.158159597411934,
"grad_norm": 0.5520568816361435,
"learning_rate": 7.874101802130962e-06,
"loss": 0.2257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1408407986164093,
"step": 3590,
"valid_targets_mean": 4108.1,
"valid_targets_min": 572
},
{
"epoch": 5.165348670021567,
"grad_norm": 0.5558116754962581,
"learning_rate": 7.817192538742006e-06,
"loss": 0.233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14348295331001282,
"step": 3595,
"valid_targets_mean": 4215.8,
"valid_targets_min": 581
},
{
"epoch": 5.1725377426312,
"grad_norm": 0.4732036564036685,
"learning_rate": 7.760439678533116e-06,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10638897120952606,
"step": 3600,
"valid_targets_mean": 4069.9,
"valid_targets_min": 655
},
{
"epoch": 5.179726815240834,
"grad_norm": 0.46187611868482703,
"learning_rate": 7.703843950098896e-06,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12339513003826141,
"step": 3605,
"valid_targets_mean": 4986.5,
"valid_targets_min": 3772
},
{
"epoch": 5.186915887850467,
"grad_norm": 0.47709162253072873,
"learning_rate": 7.647406080016689e-06,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10468283295631409,
"step": 3610,
"valid_targets_mean": 4060.6,
"valid_targets_min": 516
},
{
"epoch": 5.194104960460101,
"grad_norm": 0.4666448228118238,
"learning_rate": 7.59112679283726e-06,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10728386789560318,
"step": 3615,
"valid_targets_mean": 4606.5,
"valid_targets_min": 689
},
{
"epoch": 5.201294033069734,
"grad_norm": 0.47925545974428047,
"learning_rate": 7.535006811075472e-06,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14180710911750793,
"step": 3620,
"valid_targets_mean": 5071.1,
"valid_targets_min": 572
},
{
"epoch": 5.208483105679368,
"grad_norm": 0.580957255481736,
"learning_rate": 7.479046855201018e-06,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17155005037784576,
"step": 3625,
"valid_targets_mean": 4656.0,
"valid_targets_min": 604
},
{
"epoch": 5.215672178289001,
"grad_norm": 0.5079874024744255,
"learning_rate": 7.4232476436291766e-06,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1037202775478363,
"step": 3630,
"valid_targets_mean": 3508.1,
"valid_targets_min": 818
},
{
"epoch": 5.222861250898634,
"grad_norm": 0.5341354860008051,
"learning_rate": 7.3676098927116e-06,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12585100531578064,
"step": 3635,
"valid_targets_mean": 3564.9,
"valid_targets_min": 802
},
{
"epoch": 5.230050323508268,
"grad_norm": 0.654732208865685,
"learning_rate": 7.312134316727093e-06,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1112690344452858,
"step": 3640,
"valid_targets_mean": 4563.2,
"valid_targets_min": 897
},
{
"epoch": 5.237239396117901,
"grad_norm": 0.627062993991902,
"learning_rate": 7.256821627872448e-06,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12680819630622864,
"step": 3645,
"valid_targets_mean": 3043.4,
"valid_targets_min": 493
},
{
"epoch": 5.244428468727534,
"grad_norm": 0.4696774303220318,
"learning_rate": 7.2016725362533276e-06,
"loss": 0.2213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09891338646411896,
"step": 3650,
"valid_targets_mean": 3879.6,
"valid_targets_min": 661
},
{
"epoch": 5.2516175413371675,
"grad_norm": 0.5242072466435919,
"learning_rate": 7.146687749875116e-06,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13201574981212616,
"step": 3655,
"valid_targets_mean": 5096.6,
"valid_targets_min": 693
},
{
"epoch": 5.258806613946801,
"grad_norm": 0.5949854365395237,
"learning_rate": 7.091867974633841e-06,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10788040608167648,
"step": 3660,
"valid_targets_mean": 2561.8,
"valid_targets_min": 558
},
{
"epoch": 5.265995686556434,
"grad_norm": 0.5240634062040213,
"learning_rate": 7.037213914307115e-06,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10503746569156647,
"step": 3665,
"valid_targets_mean": 3181.1,
"valid_targets_min": 523
},
{
"epoch": 5.273184759166067,
"grad_norm": 0.5267318614037361,
"learning_rate": 6.9827262705451105e-06,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1396285593509674,
"step": 3670,
"valid_targets_mean": 4749.4,
"valid_targets_min": 656
},
{
"epoch": 5.280373831775701,
"grad_norm": 0.47731072982521167,
"learning_rate": 6.928405742861526e-06,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1177634596824646,
"step": 3675,
"valid_targets_mean": 4171.5,
"valid_targets_min": 464
},
{
"epoch": 5.287562904385334,
"grad_norm": 0.5068202864119911,
"learning_rate": 6.874253028624625e-06,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10211893916130066,
"step": 3680,
"valid_targets_mean": 3619.4,
"valid_targets_min": 902
},
{
"epoch": 5.294751976994967,
"grad_norm": 0.5016652817729716,
"learning_rate": 6.820268823048266e-06,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13110285997390747,
"step": 3685,
"valid_targets_mean": 4559.0,
"valid_targets_min": 739
},
{
"epoch": 5.301941049604601,
"grad_norm": 0.5322028847511757,
"learning_rate": 6.7664538191830165e-06,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1111895740032196,
"step": 3690,
"valid_targets_mean": 3257.4,
"valid_targets_min": 746
},
{
"epoch": 5.309130122214234,
"grad_norm": 0.5242815050747506,
"learning_rate": 6.712808707907206e-06,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09911448508501053,
"step": 3695,
"valid_targets_mean": 3859.8,
"valid_targets_min": 855
},
{
"epoch": 5.316319194823867,
"grad_norm": 0.5274184494318976,
"learning_rate": 6.659334177918075e-06,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10168007016181946,
"step": 3700,
"valid_targets_mean": 2894.0,
"valid_targets_min": 649
},
{
"epoch": 5.3235082674335015,
"grad_norm": 0.5580532302216001,
"learning_rate": 6.6060309157229566e-06,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12171245366334915,
"step": 3705,
"valid_targets_mean": 3291.8,
"valid_targets_min": 532
},
{
"epoch": 5.330697340043135,
"grad_norm": 0.5325308799675936,
"learning_rate": 6.55289960563044e-06,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10376730561256409,
"step": 3710,
"valid_targets_mean": 3438.8,
"valid_targets_min": 604
},
{
"epoch": 5.337886412652768,
"grad_norm": 0.5586213161057807,
"learning_rate": 6.499940929741577e-06,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09677755832672119,
"step": 3715,
"valid_targets_mean": 2735.0,
"valid_targets_min": 620
},
{
"epoch": 5.345075485262401,
"grad_norm": 0.5663803576851734,
"learning_rate": 6.447155567941141e-06,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11576307564973831,
"step": 3720,
"valid_targets_mean": 3961.1,
"valid_targets_min": 645
},
{
"epoch": 5.352264557872035,
"grad_norm": 0.47758908764240937,
"learning_rate": 6.394544197888895e-06,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08779515326023102,
"step": 3725,
"valid_targets_mean": 3460.2,
"valid_targets_min": 666
},
{
"epoch": 5.359453630481668,
"grad_norm": 0.5371407252655028,
"learning_rate": 6.342107495010903e-06,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1303025633096695,
"step": 3730,
"valid_targets_mean": 3453.9,
"valid_targets_min": 582
},
{
"epoch": 5.366642703091301,
"grad_norm": 0.5433261944894747,
"learning_rate": 6.289846132490836e-06,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10139200091362,
"step": 3735,
"valid_targets_mean": 3614.2,
"valid_targets_min": 485
},
{
"epoch": 5.373831775700935,
"grad_norm": 0.4892527224392483,
"learning_rate": 6.237760781261339e-06,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12653936445713043,
"step": 3740,
"valid_targets_mean": 4815.8,
"valid_targets_min": 3923
},
{
"epoch": 5.381020848310568,
"grad_norm": 0.6281676767553033,
"learning_rate": 6.185852109995423e-06,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14503289759159088,
"step": 3745,
"valid_targets_mean": 4049.6,
"valid_targets_min": 577
},
{
"epoch": 5.388209920920201,
"grad_norm": 0.5139220394937787,
"learning_rate": 6.1341207850978905e-06,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09314952790737152,
"step": 3750,
"valid_targets_mean": 3192.6,
"valid_targets_min": 647
},
{
"epoch": 5.3953989935298345,
"grad_norm": 0.5836967326755717,
"learning_rate": 6.082567470696747e-06,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11038590967655182,
"step": 3755,
"valid_targets_mean": 3321.2,
"valid_targets_min": 691
},
{
"epoch": 5.402588066139468,
"grad_norm": 0.5862170542230964,
"learning_rate": 6.0311928286347e-06,
"loss": 0.2306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.150666743516922,
"step": 3760,
"valid_targets_mean": 4635.4,
"valid_targets_min": 4223
},
{
"epoch": 5.409777138749101,
"grad_norm": 0.5619243601117232,
"learning_rate": 5.97999751846067e-06,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11010795086622238,
"step": 3765,
"valid_targets_mean": 3656.0,
"valid_targets_min": 830
},
{
"epoch": 5.4169662113587345,
"grad_norm": 0.4793247356400887,
"learning_rate": 5.9289821974212956e-06,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0704135149717331,
"step": 3770,
"valid_targets_mean": 2109.9,
"valid_targets_min": 330
},
{
"epoch": 5.424155283968368,
"grad_norm": 0.517481898207876,
"learning_rate": 5.878147520452517e-06,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10165617614984512,
"step": 3775,
"valid_targets_mean": 3652.1,
"valid_targets_min": 567
},
{
"epoch": 5.431344356578001,
"grad_norm": 0.6135944967500202,
"learning_rate": 5.827494140171152e-06,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09592735767364502,
"step": 3780,
"valid_targets_mean": 2568.6,
"valid_targets_min": 486
},
{
"epoch": 5.438533429187634,
"grad_norm": 0.49746523639145324,
"learning_rate": 5.7770227068665485e-06,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0968160480260849,
"step": 3785,
"valid_targets_mean": 3214.0,
"valid_targets_min": 699
},
{
"epoch": 5.445722501797269,
"grad_norm": 0.6088131457344995,
"learning_rate": 5.726733868492196e-06,
"loss": 0.2429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12237273901700974,
"step": 3790,
"valid_targets_mean": 2801.8,
"valid_targets_min": 704
},
{
"epoch": 5.452911574406902,
"grad_norm": 0.4755640662150841,
"learning_rate": 5.676628270657429e-06,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10788771510124207,
"step": 3795,
"valid_targets_mean": 3890.1,
"valid_targets_min": 767
},
{
"epoch": 5.460100647016535,
"grad_norm": 0.5564304734402853,
"learning_rate": 5.626706556619132e-06,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11956202983856201,
"step": 3800,
"valid_targets_mean": 3888.9,
"valid_targets_min": 828
},
{
"epoch": 5.4672897196261685,
"grad_norm": 0.5718654277621241,
"learning_rate": 5.576969367273506e-06,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13896629214286804,
"step": 3805,
"valid_targets_mean": 4125.5,
"valid_targets_min": 710
},
{
"epoch": 5.474478792235802,
"grad_norm": 0.5032497846155108,
"learning_rate": 5.527417341147794e-06,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09287270903587341,
"step": 3810,
"valid_targets_mean": 3537.1,
"valid_targets_min": 686
},
{
"epoch": 5.481667864845435,
"grad_norm": 0.4915204373542724,
"learning_rate": 5.4780511143921115e-06,
"loss": 0.23,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1148151308298111,
"step": 3815,
"valid_targets_mean": 4444.5,
"valid_targets_min": 617
},
{
"epoch": 5.488856937455068,
"grad_norm": 0.6047640594429146,
"learning_rate": 5.428871320771296e-06,
"loss": 0.233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1029304563999176,
"step": 3820,
"valid_targets_mean": 2823.0,
"valid_targets_min": 772
},
{
"epoch": 5.496046010064702,
"grad_norm": 0.510548508866447,
"learning_rate": 5.379878591656742e-06,
"loss": 0.2237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1139189675450325,
"step": 3825,
"valid_targets_mean": 3634.5,
"valid_targets_min": 534
},
{
"epoch": 5.503235082674335,
"grad_norm": 0.5003942789953372,
"learning_rate": 5.3310735560183e-06,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11003319919109344,
"step": 3830,
"valid_targets_mean": 4281.6,
"valid_targets_min": 949
},
{
"epoch": 5.510424155283968,
"grad_norm": 0.6576710045774764,
"learning_rate": 5.28245684041621e-06,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1553100049495697,
"step": 3835,
"valid_targets_mean": 3864.1,
"valid_targets_min": 718
},
{
"epoch": 5.517613227893602,
"grad_norm": 0.47410941520350275,
"learning_rate": 5.2340290689930515e-06,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11888614296913147,
"step": 3840,
"valid_targets_mean": 3732.5,
"valid_targets_min": 732
},
{
"epoch": 5.524802300503235,
"grad_norm": 0.5085462942465262,
"learning_rate": 5.185790863465747e-06,
"loss": 0.2408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10465127229690552,
"step": 3845,
"valid_targets_mean": 3367.5,
"valid_targets_min": 685
},
{
"epoch": 5.531991373112868,
"grad_norm": 0.4801234294164676,
"learning_rate": 5.137742843117555e-06,
"loss": 0.2205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09817088395357132,
"step": 3850,
"valid_targets_mean": 3293.4,
"valid_targets_min": 564
},
{
"epoch": 5.539180445722502,
"grad_norm": 0.5305608181594179,
"learning_rate": 5.089885624790134e-06,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09850573539733887,
"step": 3855,
"valid_targets_mean": 3317.8,
"valid_targets_min": 679
},
{
"epoch": 5.546369518332135,
"grad_norm": 0.6077286044826221,
"learning_rate": 5.042219822875618e-06,
"loss": 0.2306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10427510738372803,
"step": 3860,
"valid_targets_mean": 3405.0,
"valid_targets_min": 655
},
{
"epoch": 5.553558590941768,
"grad_norm": 0.5246120803533588,
"learning_rate": 4.994746049308747e-06,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11735428869724274,
"step": 3865,
"valid_targets_mean": 3809.6,
"valid_targets_min": 878
},
{
"epoch": 5.5607476635514015,
"grad_norm": 0.605950559060801,
"learning_rate": 4.947464913558986e-06,
"loss": 0.2333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11098338663578033,
"step": 3870,
"valid_targets_mean": 4339.1,
"valid_targets_min": 751
},
{
"epoch": 5.567936736161036,
"grad_norm": 0.580577525790607,
"learning_rate": 4.900377022622702e-06,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15154002606868744,
"step": 3875,
"valid_targets_mean": 3963.5,
"valid_targets_min": 916
},
{
"epoch": 5.575125808770668,
"grad_norm": 0.5518840282788854,
"learning_rate": 4.8534829810154e-06,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12235703319311142,
"step": 3880,
"valid_targets_mean": 4262.4,
"valid_targets_min": 411
},
{
"epoch": 5.582314881380302,
"grad_norm": 0.555269161273212,
"learning_rate": 4.806783390763932e-06,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09165024757385254,
"step": 3885,
"valid_targets_mean": 3564.1,
"valid_targets_min": 615
},
{
"epoch": 5.589503953989936,
"grad_norm": 0.47658903316409296,
"learning_rate": 4.760278851398776e-06,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0927685797214508,
"step": 3890,
"valid_targets_mean": 3430.5,
"valid_targets_min": 756
},
{
"epoch": 5.596693026599569,
"grad_norm": 0.5813698001221245,
"learning_rate": 4.7139699599463426e-06,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1289849877357483,
"step": 3895,
"valid_targets_mean": 3189.4,
"valid_targets_min": 593
},
{
"epoch": 5.603882099209202,
"grad_norm": 0.5485491518781684,
"learning_rate": 4.66785731092132e-06,
"loss": 0.2303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10561780631542206,
"step": 3900,
"valid_targets_mean": 3082.2,
"valid_targets_min": 624
},
{
"epoch": 5.6110711718188355,
"grad_norm": 0.6088578449194925,
"learning_rate": 4.621941496319023e-06,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12965992093086243,
"step": 3905,
"valid_targets_mean": 3030.9,
"valid_targets_min": 539
},
{
"epoch": 5.618260244428469,
"grad_norm": 0.5743980711000396,
"learning_rate": 4.5762231056077976e-06,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11457179486751556,
"step": 3910,
"valid_targets_mean": 3469.0,
"valid_targets_min": 613
},
{
"epoch": 5.625449317038102,
"grad_norm": 0.5735979192233173,
"learning_rate": 4.530702725721456e-06,
"loss": 0.2334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16201013326644897,
"step": 3915,
"valid_targets_mean": 4685.4,
"valid_targets_min": 716
},
{
"epoch": 5.632638389647735,
"grad_norm": 0.5314576556957686,
"learning_rate": 4.485380941051764e-06,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13539963960647583,
"step": 3920,
"valid_targets_mean": 4214.4,
"valid_targets_min": 2348
},
{
"epoch": 5.639827462257369,
"grad_norm": 0.4962243478682359,
"learning_rate": 4.4402583334408925e-06,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1239946112036705,
"step": 3925,
"valid_targets_mean": 4401.9,
"valid_targets_min": 772
},
{
"epoch": 5.647016534867002,
"grad_norm": 0.5608654561683951,
"learning_rate": 4.3953354821739745e-06,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10213188081979752,
"step": 3930,
"valid_targets_mean": 3199.0,
"valid_targets_min": 595
},
{
"epoch": 5.654205607476635,
"grad_norm": 0.4264040054006142,
"learning_rate": 4.350612963971683e-06,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11011867970228195,
"step": 3935,
"valid_targets_mean": 5150.9,
"valid_targets_min": 4219
},
{
"epoch": 5.661394680086269,
"grad_norm": 0.7527457817817157,
"learning_rate": 4.3060913529828e-06,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13459980487823486,
"step": 3940,
"valid_targets_mean": 4806.9,
"valid_targets_min": 4005
},
{
"epoch": 5.668583752695902,
"grad_norm": 0.5037853732946838,
"learning_rate": 4.261771220776856e-06,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10649976134300232,
"step": 3945,
"valid_targets_mean": 4182.1,
"valid_targets_min": 939
},
{
"epoch": 5.675772825305535,
"grad_norm": 0.49120828952402623,
"learning_rate": 4.217653136336788e-06,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10088129341602325,
"step": 3950,
"valid_targets_mean": 3940.2,
"valid_targets_min": 612
},
{
"epoch": 5.682961897915169,
"grad_norm": 0.5345061789069356,
"learning_rate": 4.173737666051638e-06,
"loss": 0.2285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11330173909664154,
"step": 3955,
"valid_targets_mean": 3495.2,
"valid_targets_min": 634
},
{
"epoch": 5.690150970524803,
"grad_norm": 0.5495034857434233,
"learning_rate": 4.1300253737092985e-06,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08555985987186432,
"step": 3960,
"valid_targets_mean": 2754.5,
"valid_targets_min": 558
},
{
"epoch": 5.697340043134435,
"grad_norm": 0.5504471166752093,
"learning_rate": 4.086516820489244e-06,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11938584595918655,
"step": 3965,
"valid_targets_mean": 4737.6,
"valid_targets_min": 818
},
{
"epoch": 5.704529115744069,
"grad_norm": 0.7024099146976166,
"learning_rate": 4.043212564955341e-06,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11366365849971771,
"step": 3970,
"valid_targets_mean": 3613.2,
"valid_targets_min": 769
},
{
"epoch": 5.711718188353703,
"grad_norm": 0.5567797213556551,
"learning_rate": 4.000113163048678e-06,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12813721597194672,
"step": 3975,
"valid_targets_mean": 3827.0,
"valid_targets_min": 753
},
{
"epoch": 5.718907260963336,
"grad_norm": 0.4820690425614344,
"learning_rate": 3.957219168080439e-06,
"loss": 0.2257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08902594447135925,
"step": 3980,
"valid_targets_mean": 3253.6,
"valid_targets_min": 629
},
{
"epoch": 5.726096333572969,
"grad_norm": 0.5241838560174583,
"learning_rate": 3.914531130724777e-06,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10416141152381897,
"step": 3985,
"valid_targets_mean": 3481.9,
"valid_targets_min": 673
},
{
"epoch": 5.733285406182603,
"grad_norm": 0.55638613732615,
"learning_rate": 3.872049599011754e-06,
"loss": 0.2245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.087767094373703,
"step": 3990,
"valid_targets_mean": 2224.9,
"valid_targets_min": 611
},
{
"epoch": 5.740474478792236,
"grad_norm": 0.5096808510890435,
"learning_rate": 3.829775118320322e-06,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12581051886081696,
"step": 3995,
"valid_targets_mean": 4320.4,
"valid_targets_min": 991
},
{
"epoch": 5.747663551401869,
"grad_norm": 0.5525616374673865,
"learning_rate": 3.7877082313712944e-06,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11794079840183258,
"step": 4000,
"valid_targets_mean": 3695.4,
"valid_targets_min": 877
},
{
"epoch": 5.7548526240115025,
"grad_norm": 0.5443711074253681,
"learning_rate": 3.7458494782203915e-06,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13976985216140747,
"step": 4005,
"valid_targets_mean": 4345.1,
"valid_targets_min": 702
},
{
"epoch": 5.762041696621136,
"grad_norm": 0.5340557650606426,
"learning_rate": 3.7041993962513066e-06,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10117100179195404,
"step": 4010,
"valid_targets_mean": 3320.6,
"valid_targets_min": 743
},
{
"epoch": 5.769230769230769,
"grad_norm": 0.4803688175797287,
"learning_rate": 3.662758520168821e-06,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08951431512832642,
"step": 4015,
"valid_targets_mean": 3885.5,
"valid_targets_min": 705
},
{
"epoch": 5.7764198418404025,
"grad_norm": 0.48476516277316617,
"learning_rate": 3.6215273819919095e-06,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12080979347229004,
"step": 4020,
"valid_targets_mean": 4147.9,
"valid_targets_min": 489
},
{
"epoch": 5.783608914450036,
"grad_norm": 0.6249752714144173,
"learning_rate": 3.5805065110469306e-06,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13403496146202087,
"step": 4025,
"valid_targets_mean": 3137.0,
"valid_targets_min": 864
},
{
"epoch": 5.790797987059669,
"grad_norm": 0.5364924278381279,
"learning_rate": 3.5396964339608266e-06,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11756608635187149,
"step": 4030,
"valid_targets_mean": 4123.2,
"valid_targets_min": 635
},
{
"epoch": 5.797987059669302,
"grad_norm": 0.5109349298834557,
"learning_rate": 3.4990976746543727e-06,
"loss": 0.2206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10641781985759735,
"step": 4035,
"valid_targets_mean": 3795.5,
"valid_targets_min": 865
},
{
"epoch": 5.805176132278936,
"grad_norm": 0.5425174482086091,
"learning_rate": 3.4587107543354236e-06,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10321540385484695,
"step": 4040,
"valid_targets_mean": 3321.0,
"valid_targets_min": 507
},
{
"epoch": 5.812365204888569,
"grad_norm": 0.4547290274337963,
"learning_rate": 3.4185361914922588e-06,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10309769958257675,
"step": 4045,
"valid_targets_mean": 4833.1,
"valid_targets_min": 762
},
{
"epoch": 5.819554277498202,
"grad_norm": 0.6674311050708079,
"learning_rate": 3.378574501886891e-06,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14393368363380432,
"step": 4050,
"valid_targets_mean": 3134.4,
"valid_targets_min": 683
},
{
"epoch": 5.8267433501078365,
"grad_norm": 0.5103372393228983,
"learning_rate": 3.338826198548477e-06,
"loss": 0.2348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09888037294149399,
"step": 4055,
"valid_targets_mean": 4051.0,
"valid_targets_min": 844
},
{
"epoch": 5.83393242271747,
"grad_norm": 0.5656063140256278,
"learning_rate": 3.299291791766703e-06,
"loss": 0.2205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09367987513542175,
"step": 4060,
"valid_targets_mean": 2694.8,
"valid_targets_min": 482
},
{
"epoch": 5.841121495327103,
"grad_norm": 0.8203760991873118,
"learning_rate": 3.2599717890852502e-06,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13091842830181122,
"step": 4065,
"valid_targets_mean": 3690.6,
"valid_targets_min": 592
},
{
"epoch": 5.848310567936736,
"grad_norm": 1.1540642624867812,
"learning_rate": 3.220866695295266e-06,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09300343692302704,
"step": 4070,
"valid_targets_mean": 2594.1,
"valid_targets_min": 606
},
{
"epoch": 5.85549964054637,
"grad_norm": 0.5416675522579539,
"learning_rate": 3.181977012428914e-06,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09534624218940735,
"step": 4075,
"valid_targets_mean": 3515.5,
"valid_targets_min": 659
},
{
"epoch": 5.862688713156003,
"grad_norm": 0.5680889544101823,
"learning_rate": 3.143303239752886e-06,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10078851878643036,
"step": 4080,
"valid_targets_mean": 3410.9,
"valid_targets_min": 839
},
{
"epoch": 5.869877785765636,
"grad_norm": 0.48763425732795723,
"learning_rate": 3.1048458737620258e-06,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12355795502662659,
"step": 4085,
"valid_targets_mean": 4751.1,
"valid_targets_min": 3760
},
{
"epoch": 5.87706685837527,
"grad_norm": 0.5255237214520677,
"learning_rate": 3.066605408172929e-06,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09903688728809357,
"step": 4090,
"valid_targets_mean": 3674.5,
"valid_targets_min": 948
},
{
"epoch": 5.884255930984903,
"grad_norm": 0.6092363999584978,
"learning_rate": 3.028582333917638e-06,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10750824213027954,
"step": 4095,
"valid_targets_mean": 3747.6,
"valid_targets_min": 940
},
{
"epoch": 5.891445003594536,
"grad_norm": 0.46322807716375014,
"learning_rate": 2.9907771391373087e-06,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.110776387155056,
"step": 4100,
"valid_targets_mean": 4066.8,
"valid_targets_min": 633
},
{
"epoch": 5.89863407620417,
"grad_norm": 0.5530260841245102,
"learning_rate": 2.9531903091759464e-06,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11539137363433838,
"step": 4105,
"valid_targets_mean": 3571.0,
"valid_targets_min": 667
},
{
"epoch": 5.905823148813803,
"grad_norm": 0.49404735005998257,
"learning_rate": 2.915822326574205e-06,
"loss": 0.2121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09268874675035477,
"step": 4110,
"valid_targets_mean": 3558.6,
"valid_targets_min": 814
},
{
"epoch": 5.913012221423436,
"grad_norm": 0.5418163287700767,
"learning_rate": 2.8786736710631547e-06,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08183282613754272,
"step": 4115,
"valid_targets_mean": 2856.6,
"valid_targets_min": 529
},
{
"epoch": 5.9202012940330695,
"grad_norm": 0.5829105600425594,
"learning_rate": 2.841744819558141e-06,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1069040447473526,
"step": 4120,
"valid_targets_mean": 3141.1,
"valid_targets_min": 467
},
{
"epoch": 5.927390366642703,
"grad_norm": 0.5522333370692242,
"learning_rate": 2.8050362461526614e-06,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10800863802433014,
"step": 4125,
"valid_targets_mean": 3894.9,
"valid_targets_min": 797
},
{
"epoch": 5.934579439252336,
"grad_norm": 0.5126538599484419,
"learning_rate": 2.7685484221122847e-06,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1306709349155426,
"step": 4130,
"valid_targets_mean": 4314.8,
"valid_targets_min": 840
},
{
"epoch": 5.941768511861969,
"grad_norm": 0.5394517626708155,
"learning_rate": 2.7322818158685847e-06,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13361993432044983,
"step": 4135,
"valid_targets_mean": 3994.2,
"valid_targets_min": 853
},
{
"epoch": 5.948957584471604,
"grad_norm": 0.5359612939529111,
"learning_rate": 2.696236893013138e-06,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10245585441589355,
"step": 4140,
"valid_targets_mean": 3500.2,
"valid_targets_min": 649
},
{
"epoch": 5.956146657081236,
"grad_norm": 0.5688862266244793,
"learning_rate": 2.660414116291543e-06,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09202219545841217,
"step": 4145,
"valid_targets_mean": 2825.6,
"valid_targets_min": 611
},
{
"epoch": 5.96333572969087,
"grad_norm": 0.5610739413081085,
"learning_rate": 2.624813945597493e-06,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12422355264425278,
"step": 4150,
"valid_targets_mean": 4198.4,
"valid_targets_min": 700
},
{
"epoch": 5.9705248023005035,
"grad_norm": 0.5885410928110363,
"learning_rate": 2.5894368379668367e-06,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09310132265090942,
"step": 4155,
"valid_targets_mean": 2653.9,
"valid_targets_min": 691
},
{
"epoch": 5.977713874910137,
"grad_norm": 0.5635217064321498,
"learning_rate": 2.5542832475717605e-06,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13913258910179138,
"step": 4160,
"valid_targets_mean": 4385.0,
"valid_targets_min": 867
},
{
"epoch": 5.98490294751977,
"grad_norm": 0.48587755558221085,
"learning_rate": 2.5193536257149045e-06,
"loss": 0.2257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0926017239689827,
"step": 4165,
"valid_targets_mean": 3001.0,
"valid_targets_min": 889
},
{
"epoch": 5.9920920201294035,
"grad_norm": 0.5248853589772831,
"learning_rate": 2.484648420823621e-06,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11225050687789917,
"step": 4170,
"valid_targets_mean": 3894.8,
"valid_targets_min": 785
},
{
"epoch": 5.999281092739037,
"grad_norm": 0.49185549380354215,
"learning_rate": 2.4501680784441704e-06,
"loss": 0.2275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12695342302322388,
"step": 4175,
"valid_targets_mean": 4756.8,
"valid_targets_min": 851
},
{
"epoch": 6.005751258087707,
"grad_norm": 0.5895294664188037,
"learning_rate": 2.415913041236033e-06,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1118449717760086,
"step": 4180,
"valid_targets_mean": 4720.0,
"valid_targets_min": 3732
},
{
"epoch": 6.01294033069734,
"grad_norm": 0.6638987983800019,
"learning_rate": 2.3818837489662096e-06,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10860610008239746,
"step": 4185,
"valid_targets_mean": 2938.6,
"valid_targets_min": 773
},
{
"epoch": 6.020129403306973,
"grad_norm": 0.47545987837037096,
"learning_rate": 2.348080638503596e-06,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12051060050725937,
"step": 4190,
"valid_targets_mean": 4825.9,
"valid_targets_min": 702
},
{
"epoch": 6.027318475916607,
"grad_norm": 0.511588230010411,
"learning_rate": 2.3145041438133476e-06,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11961148679256439,
"step": 4195,
"valid_targets_mean": 4777.9,
"valid_targets_min": 3944
},
{
"epoch": 6.03450754852624,
"grad_norm": 0.553898288205841,
"learning_rate": 2.2811546959513196e-06,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13163530826568604,
"step": 4200,
"valid_targets_mean": 4873.9,
"valid_targets_min": 3944
},
{
"epoch": 6.041696621135873,
"grad_norm": 0.5899270631407394,
"learning_rate": 2.24803272305854e-06,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1202486902475357,
"step": 4205,
"valid_targets_mean": 3210.9,
"valid_targets_min": 597
},
{
"epoch": 6.048885693745507,
"grad_norm": 0.5810648705314886,
"learning_rate": 2.21513865035571e-06,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10933034867048264,
"step": 4210,
"valid_targets_mean": 3725.1,
"valid_targets_min": 601
},
{
"epoch": 6.05607476635514,
"grad_norm": 0.449972261249417,
"learning_rate": 2.1824729001377396e-06,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10579677671194077,
"step": 4215,
"valid_targets_mean": 4484.1,
"valid_targets_min": 3859
},
{
"epoch": 6.063263838964773,
"grad_norm": 0.4943133972872266,
"learning_rate": 2.150035891768323e-06,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13363003730773926,
"step": 4220,
"valid_targets_mean": 4613.4,
"valid_targets_min": 678
},
{
"epoch": 6.070452911574407,
"grad_norm": 0.5929568384137042,
"learning_rate": 2.1178280416745743e-06,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06701067090034485,
"step": 4225,
"valid_targets_mean": 1870.5,
"valid_targets_min": 446
},
{
"epoch": 6.07764198418404,
"grad_norm": 0.4803255814125173,
"learning_rate": 2.0858497633416565e-06,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09893548488616943,
"step": 4230,
"valid_targets_mean": 3892.6,
"valid_targets_min": 670
},
{
"epoch": 6.084831056793673,
"grad_norm": 0.6263462306661182,
"learning_rate": 2.0541014673074898e-06,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13514085114002228,
"step": 4235,
"valid_targets_mean": 4169.0,
"valid_targets_min": 728
},
{
"epoch": 6.092020129403307,
"grad_norm": 0.5421931016830664,
"learning_rate": 2.0225835611574697e-06,
"loss": 0.2139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11666776239871979,
"step": 4240,
"valid_targets_mean": 3620.8,
"valid_targets_min": 915
},
{
"epoch": 6.099209202012941,
"grad_norm": 0.4857697103944299,
"learning_rate": 1.9912964495192533e-06,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11697093397378922,
"step": 4245,
"valid_targets_mean": 5469.8,
"valid_targets_min": 640
},
{
"epoch": 6.106398274622574,
"grad_norm": 0.5323926029594881,
"learning_rate": 1.9602405340575446e-06,
"loss": 0.217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10784275829792023,
"step": 4250,
"valid_targets_mean": 3823.8,
"valid_targets_min": 825
},
{
"epoch": 6.113587347232207,
"grad_norm": 0.5447888444803873,
"learning_rate": 1.929416213468942e-06,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10931412875652313,
"step": 4255,
"valid_targets_mean": 3607.9,
"valid_targets_min": 609
},
{
"epoch": 6.120776419841841,
"grad_norm": 0.6144296819100742,
"learning_rate": 1.8988238834768235e-06,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12556231021881104,
"step": 4260,
"valid_targets_mean": 3070.2,
"valid_targets_min": 534
},
{
"epoch": 6.127965492451474,
"grad_norm": 0.49482382131724245,
"learning_rate": 1.8684639368262792e-06,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1340388059616089,
"step": 4265,
"valid_targets_mean": 5229.5,
"valid_targets_min": 4362
},
{
"epoch": 6.135154565061107,
"grad_norm": 0.5827050871510197,
"learning_rate": 1.8383367632790384e-06,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12392894178628922,
"step": 4270,
"valid_targets_mean": 3390.2,
"valid_targets_min": 565
},
{
"epoch": 6.1423436376707405,
"grad_norm": 0.5131318427074524,
"learning_rate": 1.8084427496084967e-06,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1041579395532608,
"step": 4275,
"valid_targets_mean": 3940.1,
"valid_targets_min": 742
},
{
"epoch": 6.149532710280374,
"grad_norm": 0.5963777062849123,
"learning_rate": 1.7787822795947262e-06,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09274083375930786,
"step": 4280,
"valid_targets_mean": 2919.9,
"valid_targets_min": 717
},
{
"epoch": 6.156721782890007,
"grad_norm": 0.49582307100103684,
"learning_rate": 1.7493557340195754e-06,
"loss": 0.2141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09546741843223572,
"step": 4285,
"valid_targets_mean": 4019.0,
"valid_targets_min": 934
},
{
"epoch": 6.1639108554996405,
"grad_norm": 0.4871415848643614,
"learning_rate": 1.7201634906617504e-06,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10446576774120331,
"step": 4290,
"valid_targets_mean": 4068.0,
"valid_targets_min": 649
},
{
"epoch": 6.171099928109274,
"grad_norm": 0.47120731528371945,
"learning_rate": 1.6912059242919853e-06,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11221934854984283,
"step": 4295,
"valid_targets_mean": 4832.8,
"valid_targets_min": 895
},
{
"epoch": 6.178289000718907,
"grad_norm": 0.4965531368094695,
"learning_rate": 1.6624834066682248e-06,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09528857469558716,
"step": 4300,
"valid_targets_mean": 3653.1,
"valid_targets_min": 748
},
{
"epoch": 6.18547807332854,
"grad_norm": 0.5756851241381141,
"learning_rate": 1.6339963065308539e-06,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08201570063829422,
"step": 4305,
"valid_targets_mean": 2631.0,
"valid_targets_min": 710
},
{
"epoch": 6.192667145938174,
"grad_norm": 0.5002106473544778,
"learning_rate": 1.6057449895979616e-06,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09970113635063171,
"step": 4310,
"valid_targets_mean": 3362.1,
"valid_targets_min": 691
},
{
"epoch": 6.199856218547807,
"grad_norm": 0.596931111317232,
"learning_rate": 1.5777298185606428e-06,
"loss": 0.2282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14602990448474884,
"step": 4315,
"valid_targets_mean": 4108.9,
"valid_targets_min": 1363
},
{
"epoch": 6.20704529115744,
"grad_norm": 0.538595523809706,
"learning_rate": 1.5499511530783462e-06,
"loss": 0.2209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12626773118972778,
"step": 4320,
"valid_targets_mean": 3403.0,
"valid_targets_min": 601
},
{
"epoch": 6.2142343637670745,
"grad_norm": 0.5490331377416214,
"learning_rate": 1.5224093497742654e-06,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11536562442779541,
"step": 4325,
"valid_targets_mean": 3286.5,
"valid_targets_min": 732
},
{
"epoch": 6.221423436376708,
"grad_norm": 0.539453466902596,
"learning_rate": 1.4951047622307413e-06,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15311205387115479,
"step": 4330,
"valid_targets_mean": 4828.9,
"valid_targets_min": 685
},
{
"epoch": 6.228612508986341,
"grad_norm": 0.5966313956547638,
"learning_rate": 1.4680377409847314e-06,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12395937740802765,
"step": 4335,
"valid_targets_mean": 3536.1,
"valid_targets_min": 713
},
{
"epoch": 6.235801581595974,
"grad_norm": 0.6171088156882476,
"learning_rate": 1.4412086335233255e-06,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13875176012516022,
"step": 4340,
"valid_targets_mean": 3610.2,
"valid_targets_min": 595
},
{
"epoch": 6.242990654205608,
"grad_norm": 0.5098548922882871,
"learning_rate": 1.4146177842792573e-06,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10508402436971664,
"step": 4345,
"valid_targets_mean": 3578.6,
"valid_targets_min": 753
},
{
"epoch": 6.250179726815241,
"grad_norm": 0.5567296804680034,
"learning_rate": 1.388265534626496e-06,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11976335197687149,
"step": 4350,
"valid_targets_mean": 4137.0,
"valid_targets_min": 558
},
{
"epoch": 6.257368799424874,
"grad_norm": 0.5039084294745627,
"learning_rate": 1.3621522228758676e-06,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09727634489536285,
"step": 4355,
"valid_targets_mean": 3437.0,
"valid_targets_min": 521
},
{
"epoch": 6.264557872034508,
"grad_norm": 0.5493758228180413,
"learning_rate": 1.336278184270714e-06,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13206574320793152,
"step": 4360,
"valid_targets_mean": 4421.5,
"valid_targets_min": 3544
},
{
"epoch": 6.271746944644141,
"grad_norm": 0.5749472389885733,
"learning_rate": 1.3106437509825676e-06,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11927582323551178,
"step": 4365,
"valid_targets_mean": 3679.4,
"valid_targets_min": 591
},
{
"epoch": 6.278936017253774,
"grad_norm": 0.5863167521975554,
"learning_rate": 1.285249252106915e-06,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09201674908399582,
"step": 4370,
"valid_targets_mean": 2855.1,
"valid_targets_min": 620
},
{
"epoch": 6.286125089863408,
"grad_norm": 0.5928713895291766,
"learning_rate": 1.2600950136589463e-06,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11213717609643936,
"step": 4375,
"valid_targets_mean": 3264.9,
"valid_targets_min": 582
},
{
"epoch": 6.293314162473041,
"grad_norm": 0.7070213599440965,
"learning_rate": 1.2351813585693995e-06,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07634206861257553,
"step": 4380,
"valid_targets_mean": 1711.0,
"valid_targets_min": 619
},
{
"epoch": 6.300503235082674,
"grad_norm": 0.6228414357157461,
"learning_rate": 1.2105086066803783e-06,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11248739063739777,
"step": 4385,
"valid_targets_mean": 3012.6,
"valid_targets_min": 685
},
{
"epoch": 6.3076923076923075,
"grad_norm": 0.5643565877084489,
"learning_rate": 1.1860770747412853e-06,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.113135427236557,
"step": 4390,
"valid_targets_mean": 2834.9,
"valid_targets_min": 603
},
{
"epoch": 6.314881380301941,
"grad_norm": 0.6000792505033019,
"learning_rate": 1.161887076404713e-06,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1297518014907837,
"step": 4395,
"valid_targets_mean": 3398.4,
"valid_targets_min": 721
},
{
"epoch": 6.322070452911574,
"grad_norm": 0.5197738471357597,
"learning_rate": 1.1379389222224612e-06,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12117072939872742,
"step": 4400,
"valid_targets_mean": 3815.1,
"valid_targets_min": 588
},
{
"epoch": 6.329259525521207,
"grad_norm": 0.6157655100543539,
"learning_rate": 1.1142329196415158e-06,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11843574792146683,
"step": 4405,
"valid_targets_mean": 3207.4,
"valid_targets_min": 736
},
{
"epoch": 6.336448598130841,
"grad_norm": 0.6007875421280104,
"learning_rate": 1.0907693730001156e-06,
"loss": 0.2102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11485160887241364,
"step": 4410,
"valid_targets_mean": 3385.8,
"valid_targets_min": 544
},
{
"epoch": 6.343637670740474,
"grad_norm": 0.5909221142624015,
"learning_rate": 1.0675485835238453e-06,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11618539690971375,
"step": 4415,
"valid_targets_mean": 3535.8,
"valid_targets_min": 656
},
{
"epoch": 6.350826743350108,
"grad_norm": 0.5883536230905861,
"learning_rate": 1.0445708493217732e-06,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16777461767196655,
"step": 4420,
"valid_targets_mean": 3526.5,
"valid_targets_min": 604
},
{
"epoch": 6.3580158159597415,
"grad_norm": 0.491586006809235,
"learning_rate": 1.0218364653826106e-06,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12006094306707382,
"step": 4425,
"valid_targets_mean": 4281.6,
"valid_targets_min": 1431
},
{
"epoch": 6.365204888569375,
"grad_norm": 0.4767502238781207,
"learning_rate": 9.993457235709325e-07,
"loss": 0.2205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10189913213253021,
"step": 4430,
"valid_targets_mean": 3844.6,
"valid_targets_min": 915
},
{
"epoch": 6.372393961179008,
"grad_norm": 0.5371473156112417,
"learning_rate": 9.770989126234287e-07,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11209119856357574,
"step": 4435,
"valid_targets_mean": 3499.1,
"valid_targets_min": 615
},
{
"epoch": 6.379583033788641,
"grad_norm": 0.6149664809993349,
"learning_rate": 9.550963181452121e-07,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10318882018327713,
"step": 4440,
"valid_targets_mean": 3142.6,
"valid_targets_min": 663
},
{
"epoch": 6.386772106398275,
"grad_norm": 0.5234090608011976,
"learning_rate": 9.333382226061216e-07,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11103767156600952,
"step": 4445,
"valid_targets_mean": 3792.0,
"valid_targets_min": 545
},
{
"epoch": 6.393961179007908,
"grad_norm": 0.5832363451984859,
"learning_rate": 9.118249053371176e-07,
"loss": 0.2197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12992234528064728,
"step": 4450,
"valid_targets_mean": 3576.0,
"valid_targets_min": 578
},
{
"epoch": 6.401150251617541,
"grad_norm": 0.4971374707007291,
"learning_rate": 8.905566425267009e-07,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11479949951171875,
"step": 4455,
"valid_targets_mean": 4383.1,
"valid_targets_min": 640
},
{
"epoch": 6.408339324227175,
"grad_norm": 0.5060142693629047,
"learning_rate": 8.695337072173448e-07,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10227428376674652,
"step": 4460,
"valid_targets_mean": 3275.5,
"valid_targets_min": 714
},
{
"epoch": 6.415528396836808,
"grad_norm": 0.5977172657593309,
"learning_rate": 8.487563693020063e-07,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10205759108066559,
"step": 4465,
"valid_targets_mean": 2500.6,
"valid_targets_min": 655
},
{
"epoch": 6.422717469446441,
"grad_norm": 0.5650433111300472,
"learning_rate": 8.282248955206573e-07,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11529181152582169,
"step": 4470,
"valid_targets_mean": 3392.5,
"valid_targets_min": 618
},
{
"epoch": 6.429906542056075,
"grad_norm": 0.5347555795795468,
"learning_rate": 8.079395494568643e-07,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10156741738319397,
"step": 4475,
"valid_targets_mean": 3383.0,
"valid_targets_min": 872
},
{
"epoch": 6.437095614665708,
"grad_norm": 0.4365670326267589,
"learning_rate": 7.879005915343918e-07,
"loss": 0.2146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1043374314904213,
"step": 4480,
"valid_targets_mean": 4653.4,
"valid_targets_min": 3482
},
{
"epoch": 6.444284687275341,
"grad_norm": 0.6426365264377848,
"learning_rate": 7.68108279013875e-07,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0819304957985878,
"step": 4485,
"valid_targets_mean": 2075.1,
"valid_targets_min": 552
},
{
"epoch": 6.4514737598849745,
"grad_norm": 0.5102964897343093,
"learning_rate": 7.485628659894994e-07,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11622590571641922,
"step": 4490,
"valid_targets_mean": 3854.1,
"valid_targets_min": 798
},
{
"epoch": 6.458662832494608,
"grad_norm": 0.8896510887896947,
"learning_rate": 7.292646033857642e-07,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12156560271978378,
"step": 4495,
"valid_targets_mean": 3445.5,
"valid_targets_min": 689
},
{
"epoch": 6.465851905104241,
"grad_norm": 0.5066774432966253,
"learning_rate": 7.102137389542285e-07,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09936122596263885,
"step": 4500,
"valid_targets_mean": 3640.1,
"valid_targets_min": 556
},
{
"epoch": 6.473040977713875,
"grad_norm": 0.48580434445087983,
"learning_rate": 6.914105172703634e-07,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10198426246643066,
"step": 4505,
"valid_targets_mean": 4095.1,
"valid_targets_min": 981
},
{
"epoch": 6.480230050323509,
"grad_norm": 0.5480915043210962,
"learning_rate": 6.728551797303806e-07,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11724647879600525,
"step": 4510,
"valid_targets_mean": 3779.5,
"valid_targets_min": 686
},
{
"epoch": 6.487419122933142,
"grad_norm": 0.4917565970472607,
"learning_rate": 6.545479645481668e-07,
"loss": 0.2257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09854386746883392,
"step": 4515,
"valid_targets_mean": 3022.0,
"valid_targets_min": 534
},
{
"epoch": 6.494608195542775,
"grad_norm": 0.5955056659476884,
"learning_rate": 6.364891067521894e-07,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14446298778057098,
"step": 4520,
"valid_targets_mean": 3898.5,
"valid_targets_min": 520
},
{
"epoch": 6.5017972681524085,
"grad_norm": 0.531573239442214,
"learning_rate": 6.186788381825115e-07,
"loss": 0.229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10202017426490784,
"step": 4525,
"valid_targets_mean": 3164.8,
"valid_targets_min": 607
},
{
"epoch": 6.508986340762042,
"grad_norm": 0.5236595235106791,
"learning_rate": 6.011173874877907e-07,
"loss": 0.2256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0913836658000946,
"step": 4530,
"valid_targets_mean": 3510.1,
"valid_targets_min": 758
},
{
"epoch": 6.516175413371675,
"grad_norm": 0.5100939636244546,
"learning_rate": 5.838049801223666e-07,
"loss": 0.2274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12276538461446762,
"step": 4535,
"valid_targets_mean": 4939.5,
"valid_targets_min": 734
},
{
"epoch": 6.5233644859813085,
"grad_norm": 0.5928341800974949,
"learning_rate": 5.667418383433454e-07,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09597209841012955,
"step": 4540,
"valid_targets_mean": 2316.5,
"valid_targets_min": 571
},
{
"epoch": 6.530553558590942,
"grad_norm": 0.5147154688423627,
"learning_rate": 5.499281812077595e-07,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11607391387224197,
"step": 4545,
"valid_targets_mean": 4424.6,
"valid_targets_min": 582
},
{
"epoch": 6.537742631200575,
"grad_norm": 0.5729816597064707,
"learning_rate": 5.333642245697479e-07,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11833793669939041,
"step": 4550,
"valid_targets_mean": 4566.2,
"valid_targets_min": 3931
},
{
"epoch": 6.544931703810208,
"grad_norm": 0.6177362139918386,
"learning_rate": 5.170501810777962e-07,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12645436823368073,
"step": 4555,
"valid_targets_mean": 3126.6,
"valid_targets_min": 666
},
{
"epoch": 6.552120776419842,
"grad_norm": 0.6246368411360932,
"learning_rate": 5.009862601719895e-07,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12022657692432404,
"step": 4560,
"valid_targets_mean": 3312.2,
"valid_targets_min": 731
},
{
"epoch": 6.559309849029475,
"grad_norm": 0.5709298820469643,
"learning_rate": 4.851726680813352e-07,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12751153111457825,
"step": 4565,
"valid_targets_mean": 4387.9,
"valid_targets_min": 630
},
{
"epoch": 6.566498921639108,
"grad_norm": 0.597713035176386,
"learning_rate": 4.6960960782111764e-07,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12144911289215088,
"step": 4570,
"valid_targets_mean": 4570.9,
"valid_targets_min": 828
},
{
"epoch": 6.573687994248742,
"grad_norm": 0.5371421698345592,
"learning_rate": 4.5429727919028777e-07,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08236388862133026,
"step": 4575,
"valid_targets_mean": 2927.4,
"valid_targets_min": 639
},
{
"epoch": 6.580877066858375,
"grad_norm": 0.48311881472200036,
"learning_rate": 4.392358787688933e-07,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11492183804512024,
"step": 4580,
"valid_targets_mean": 4438.8,
"valid_targets_min": 546
},
{
"epoch": 6.588066139468008,
"grad_norm": 0.5324096131254584,
"learning_rate": 4.2442559991555666e-07,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10867210477590561,
"step": 4585,
"valid_targets_mean": 4227.9,
"valid_targets_min": 767
},
{
"epoch": 6.595255212077642,
"grad_norm": 0.5806558853032571,
"learning_rate": 4.098666327650036e-07,
"loss": 0.2273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12176599353551865,
"step": 4590,
"valid_targets_mean": 4184.5,
"valid_targets_min": 768
},
{
"epoch": 6.602444284687275,
"grad_norm": 0.5316832508972936,
"learning_rate": 3.955591642256118e-07,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09368228912353516,
"step": 4595,
"valid_targets_mean": 3312.2,
"valid_targets_min": 617
},
{
"epoch": 6.609633357296909,
"grad_norm": 0.5262503581637803,
"learning_rate": 3.8150337797701274e-07,
"loss": 0.2253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12923449277877808,
"step": 4600,
"valid_targets_mean": 4870.6,
"valid_targets_min": 637
},
{
"epoch": 6.616822429906542,
"grad_norm": 0.5198765305609072,
"learning_rate": 3.67699454467727e-07,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09299536049365997,
"step": 4605,
"valid_targets_mean": 4086.0,
"valid_targets_min": 691
},
{
"epoch": 6.624011502516176,
"grad_norm": 0.5294711658533326,
"learning_rate": 3.5414757091287055e-07,
"loss": 0.2242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1437724232673645,
"step": 4610,
"valid_targets_mean": 5623.2,
"valid_targets_min": 4224
},
{
"epoch": 6.631200575125809,
"grad_norm": 0.5316860873672942,
"learning_rate": 3.408479012918475e-07,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11999592185020447,
"step": 4615,
"valid_targets_mean": 4838.4,
"valid_targets_min": 719
},
{
"epoch": 6.638389647735442,
"grad_norm": 0.527365776930916,
"learning_rate": 3.2780061634615e-07,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0915064588189125,
"step": 4620,
"valid_targets_mean": 3768.5,
"valid_targets_min": 671
},
{
"epoch": 6.645578720345076,
"grad_norm": 0.5476426776018154,
"learning_rate": 3.1500588357713745e-07,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15225091576576233,
"step": 4625,
"valid_targets_mean": 4842.1,
"valid_targets_min": 1040
},
{
"epoch": 6.652767792954709,
"grad_norm": 0.6528164431079474,
"learning_rate": 3.024638672439006e-07,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10779650509357452,
"step": 4630,
"valid_targets_mean": 2673.1,
"valid_targets_min": 689
},
{
"epoch": 6.659956865564342,
"grad_norm": 0.5231166358844416,
"learning_rate": 2.901747283611545e-07,
"loss": 0.2094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10894091427326202,
"step": 4635,
"valid_targets_mean": 4211.9,
"valid_targets_min": 758
},
{
"epoch": 6.6671459381739755,
"grad_norm": 0.46431337768126324,
"learning_rate": 2.7813862469716403e-07,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11026604473590851,
"step": 4640,
"valid_targets_mean": 4567.1,
"valid_targets_min": 4060
},
{
"epoch": 6.674335010783609,
"grad_norm": 0.4647171653285355,
"learning_rate": 2.663557107717196e-07,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11128712445497513,
"step": 4645,
"valid_targets_mean": 4858.0,
"valid_targets_min": 604
},
{
"epoch": 6.681524083393242,
"grad_norm": 0.5449440560939603,
"learning_rate": 2.5482613785416277e-07,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1023380309343338,
"step": 4650,
"valid_targets_mean": 3129.8,
"valid_targets_min": 653
},
{
"epoch": 6.688713156002875,
"grad_norm": 0.5273355227723932,
"learning_rate": 2.435500539614277e-07,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14378316700458527,
"step": 4655,
"valid_targets_mean": 4260.0,
"valid_targets_min": 610
},
{
"epoch": 6.695902228612509,
"grad_norm": 0.4760788362645504,
"learning_rate": 2.3252760385615858e-07,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09157054871320724,
"step": 4660,
"valid_targets_mean": 4021.9,
"valid_targets_min": 515
},
{
"epoch": 6.703091301222142,
"grad_norm": 0.5599885016265596,
"learning_rate": 2.2175892904483743e-07,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09934373944997787,
"step": 4665,
"valid_targets_mean": 3322.4,
"valid_targets_min": 736
},
{
"epoch": 6.710280373831775,
"grad_norm": 0.6374298891898735,
"learning_rate": 2.112441677759769e-07,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15255284309387207,
"step": 4670,
"valid_targets_mean": 3333.6,
"valid_targets_min": 529
},
{
"epoch": 6.7174694464414095,
"grad_norm": 0.49118289338422527,
"learning_rate": 2.0098345503833716e-07,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10941498726606369,
"step": 4675,
"valid_targets_mean": 4543.6,
"valid_targets_min": 1057
},
{
"epoch": 6.724658519051042,
"grad_norm": 0.5211196754678628,
"learning_rate": 1.9097692255919843e-07,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07783547788858414,
"step": 4680,
"valid_targets_mean": 2769.2,
"valid_targets_min": 612
},
{
"epoch": 6.731847591660676,
"grad_norm": 0.4639278461542733,
"learning_rate": 1.8122469880267335e-07,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0822891891002655,
"step": 4685,
"valid_targets_mean": 3433.8,
"valid_targets_min": 812
},
{
"epoch": 6.7390366642703095,
"grad_norm": 0.5699109580239698,
"learning_rate": 1.717269089680462e-07,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13950425386428833,
"step": 4690,
"valid_targets_mean": 3992.4,
"valid_targets_min": 440
},
{
"epoch": 6.746225736879943,
"grad_norm": 0.5247787380613426,
"learning_rate": 1.624836749881742e-07,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10433037579059601,
"step": 4695,
"valid_targets_mean": 4130.0,
"valid_targets_min": 722
},
{
"epoch": 6.753414809489576,
"grad_norm": 0.5002929707259851,
"learning_rate": 1.5349511552792406e-07,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11657604575157166,
"step": 4700,
"valid_targets_mean": 4010.6,
"valid_targets_min": 645
},
{
"epoch": 6.760603882099209,
"grad_norm": 0.5473486191985781,
"learning_rate": 1.4476134598263801e-07,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10951299965381622,
"step": 4705,
"valid_targets_mean": 3421.9,
"valid_targets_min": 775
},
{
"epoch": 6.767792954708843,
"grad_norm": 0.5364229068076471,
"learning_rate": 1.362824784766681e-07,
"loss": 0.2191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14374537765979767,
"step": 4710,
"valid_targets_mean": 4612.1,
"valid_targets_min": 3213
},
{
"epoch": 6.774982027318476,
"grad_norm": 0.4971300029350325,
"learning_rate": 1.2805862186191952e-07,
"loss": 0.2282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11811932921409607,
"step": 4715,
"valid_targets_mean": 4107.0,
"valid_targets_min": 1264
},
{
"epoch": 6.782171099928109,
"grad_norm": 0.601778889503626,
"learning_rate": 1.200898817164631e-07,
"loss": 0.2231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13035139441490173,
"step": 4720,
"valid_targets_mean": 4560.2,
"valid_targets_min": 543
},
{
"epoch": 6.789360172537743,
"grad_norm": 0.5329664913979177,
"learning_rate": 1.1237636034318045e-07,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09042935818433762,
"step": 4725,
"valid_targets_mean": 2884.6,
"valid_targets_min": 579
},
{
"epoch": 6.796549245147376,
"grad_norm": 0.5228200204151616,
"learning_rate": 1.0491815676845207e-07,
"loss": 0.2144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12473177909851074,
"step": 4730,
"valid_targets_mean": 4629.6,
"valid_targets_min": 3120
},
{
"epoch": 6.803738317757009,
"grad_norm": 0.5690118973711813,
"learning_rate": 9.771536674087145e-08,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08270010352134705,
"step": 4735,
"valid_targets_mean": 3209.2,
"valid_targets_min": 765
},
{
"epoch": 6.8109273903666425,
"grad_norm": 0.5794816335254488,
"learning_rate": 9.076808273003724e-08,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10203064233064651,
"step": 4740,
"valid_targets_mean": 3122.9,
"valid_targets_min": 471
},
{
"epoch": 6.818116462976276,
"grad_norm": 0.547427353885318,
"learning_rate": 8.407639392534972e-08,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0994785875082016,
"step": 4745,
"valid_targets_mean": 2774.4,
"valid_targets_min": 666
},
{
"epoch": 6.825305535585909,
"grad_norm": 0.5138980608440111,
"learning_rate": 7.764038623487403e-08,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11008846759796143,
"step": 4750,
"valid_targets_mean": 4515.4,
"valid_targets_min": 3798
},
{
"epoch": 6.832494608195542,
"grad_norm": 0.5818429652487563,
"learning_rate": 7.146014228423648e-08,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11513659358024597,
"step": 4755,
"valid_targets_mean": 3747.6,
"valid_targets_min": 756
},
{
"epoch": 6.839683680805176,
"grad_norm": 0.5618762340348782,
"learning_rate": 6.553574141555442e-08,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1377660632133484,
"step": 4760,
"valid_targets_mean": 4695.5,
"valid_targets_min": 830
},
{
"epoch": 6.846872753414809,
"grad_norm": 0.6855689303799838,
"learning_rate": 5.98672596864347e-08,
"loss": 0.2242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1489717960357666,
"step": 4765,
"valid_targets_mean": 5110.5,
"valid_targets_min": 3940
},
{
"epoch": 6.854061826024443,
"grad_norm": 0.5164135363567788,
"learning_rate": 5.445476986898568e-08,
"loss": 0.2193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09690165519714355,
"step": 4770,
"valid_targets_mean": 3323.0,
"valid_targets_min": 745
},
{
"epoch": 6.861250898634077,
"grad_norm": 0.5218845429859494,
"learning_rate": 4.929834144888013e-08,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11343638598918915,
"step": 4775,
"valid_targets_mean": 3724.2,
"valid_targets_min": 545
},
{
"epoch": 6.86843997124371,
"grad_norm": 0.5261894149495684,
"learning_rate": 4.439804062447373e-08,
"loss": 0.2242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13848835229873657,
"step": 4780,
"valid_targets_mean": 4062.4,
"valid_targets_min": 515
},
{
"epoch": 6.875629043853343,
"grad_norm": 0.5845958694842275,
"learning_rate": 3.9753930305950204e-08,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08328050374984741,
"step": 4785,
"valid_targets_mean": 2377.4,
"valid_targets_min": 486
},
{
"epoch": 6.8828181164629765,
"grad_norm": 0.5408789060985649,
"learning_rate": 3.536607011451088e-08,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10192709416151047,
"step": 4790,
"valid_targets_mean": 3126.0,
"valid_targets_min": 650
},
{
"epoch": 6.89000718907261,
"grad_norm": 0.5731456185915917,
"learning_rate": 3.123451638161079e-08,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09156908094882965,
"step": 4795,
"valid_targets_mean": 3015.9,
"valid_targets_min": 483
},
{
"epoch": 6.897196261682243,
"grad_norm": 0.5854299367435224,
"learning_rate": 2.7359322148237112e-08,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11642911285161972,
"step": 4800,
"valid_targets_mean": 3307.0,
"valid_targets_min": 556
},
{
"epoch": 6.904385334291876,
"grad_norm": 0.5763256439747025,
"learning_rate": 2.374053716422964e-08,
"loss": 0.219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10047812759876251,
"step": 4805,
"valid_targets_mean": 3457.4,
"valid_targets_min": 854
},
{
"epoch": 6.91157440690151,
"grad_norm": 0.5585836434639017,
"learning_rate": 2.0378207887639113e-08,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13827770948410034,
"step": 4810,
"valid_targets_mean": 3833.6,
"valid_targets_min": 691
},
{
"epoch": 6.918763479511143,
"grad_norm": 0.5021673769155096,
"learning_rate": 1.7272377484127688e-08,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09062834084033966,
"step": 4815,
"valid_targets_mean": 3467.6,
"valid_targets_min": 554
},
{
"epoch": 6.925952552120776,
"grad_norm": 0.5420506057791676,
"learning_rate": 1.4423085826427152e-08,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1145763099193573,
"step": 4820,
"valid_targets_mean": 3325.9,
"valid_targets_min": 450
},
{
"epoch": 6.93314162473041,
"grad_norm": 0.5429716282374907,
"learning_rate": 1.1830369493808225e-08,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0795266330242157,
"step": 4825,
"valid_targets_mean": 2546.1,
"valid_targets_min": 374
},
{
"epoch": 6.940330697340043,
"grad_norm": 0.48748914177526553,
"learning_rate": 9.49426177163204e-09,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1494419127702713,
"step": 4830,
"valid_targets_mean": 6738.9,
"valid_targets_min": 3612
},
{
"epoch": 6.947519769949676,
"grad_norm": 0.5597403208591729,
"learning_rate": 7.414792650901614e-09,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0868077427148819,
"step": 4835,
"valid_targets_mean": 3310.8,
"valid_targets_min": 678
},
{
"epoch": 6.9547088425593095,
"grad_norm": 0.49658819468141957,
"learning_rate": 5.591988827893247e-09,
"loss": 0.2264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08313396573066711,
"step": 4840,
"valid_targets_mean": 3697.8,
"valid_targets_min": 999
},
{
"epoch": 6.961897915168943,
"grad_norm": 0.6028617506588944,
"learning_rate": 4.025873703810135e-09,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11810679733753204,
"step": 4845,
"valid_targets_mean": 3725.8,
"valid_targets_min": 684
},
{
"epoch": 6.969086987778576,
"grad_norm": 0.5726678330735068,
"learning_rate": 2.7164673844737312e-09,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13200724124908447,
"step": 4850,
"valid_targets_mean": 4098.9,
"valid_targets_min": 575
},
{
"epoch": 6.97627606038821,
"grad_norm": 0.6080274682036577,
"learning_rate": 1.6637866800750524e-09,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12892693281173706,
"step": 4855,
"valid_targets_mean": 4071.0,
"valid_targets_min": 314
},
{
"epoch": 6.983465132997844,
"grad_norm": 0.5745138575411652,
"learning_rate": 8.678451049548564e-10,
"loss": 0.223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12005611509084702,
"step": 4860,
"valid_targets_mean": 3703.9,
"valid_targets_min": 816
},
{
"epoch": 6.990654205607477,
"grad_norm": 0.6098451214662762,
"learning_rate": 3.286528774326669e-10,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12149364501237869,
"step": 4865,
"valid_targets_mean": 3561.4,
"valid_targets_min": 927
},
{
"epoch": 6.99784327821711,
"grad_norm": 0.5050849963191119,
"learning_rate": 4.621691966688602e-11,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11706176400184631,
"step": 4870,
"valid_targets_mean": 4379.5,
"valid_targets_min": 835
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2101859748363495,
"step": 4872,
"total_flos": 2.402936079087829e+18,
"train_loss": 0.2685813971707974,
"train_runtime": 61451.9039,
"train_samples_per_second": 1.267,
"train_steps_per_second": 0.079,
"valid_targets_mean": 2883.4,
"valid_targets_min": 615
}
],
"logging_steps": 5,
"max_steps": 4872,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 2.402936079087829e+18,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}