Files
a1-stack_csharp/trainer_state.json
ModelHub XC 18855f17eb 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/a1-stack_csharp
Source: Original Platform
2026-05-04 04:13:52 +08:00

10465 lines
290 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4739,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.007385524372230428,
"grad_norm": 19.97872360716285,
"learning_rate": 3.3755274261603377e-07,
"loss": 0.624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7236873507499695,
"step": 5,
"valid_targets_mean": 4191.2,
"valid_targets_min": 560
},
{
"epoch": 0.014771048744460856,
"grad_norm": 16.297750328748872,
"learning_rate": 7.59493670886076e-07,
"loss": 0.6447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6396403312683105,
"step": 10,
"valid_targets_mean": 3906.9,
"valid_targets_min": 617
},
{
"epoch": 0.022156573116691284,
"grad_norm": 13.56762186389351,
"learning_rate": 1.1814345991561182e-06,
"loss": 0.6682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5922929048538208,
"step": 15,
"valid_targets_mean": 5468.2,
"valid_targets_min": 573
},
{
"epoch": 0.029542097488921712,
"grad_norm": 11.653889962740626,
"learning_rate": 1.6033755274261605e-06,
"loss": 0.5585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5627623796463013,
"step": 20,
"valid_targets_mean": 4871.1,
"valid_targets_min": 581
},
{
"epoch": 0.03692762186115214,
"grad_norm": 8.00562953617597,
"learning_rate": 2.0253164556962026e-06,
"loss": 0.5008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5002298355102539,
"step": 25,
"valid_targets_mean": 4081.2,
"valid_targets_min": 400
},
{
"epoch": 0.04431314623338257,
"grad_norm": 4.397412308851758,
"learning_rate": 2.447257383966245e-06,
"loss": 0.4932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4381677806377411,
"step": 30,
"valid_targets_mean": 5501.4,
"valid_targets_min": 638
},
{
"epoch": 0.051698670605613,
"grad_norm": 2.3819720550400656,
"learning_rate": 2.8691983122362873e-06,
"loss": 0.4548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4095567464828491,
"step": 35,
"valid_targets_mean": 6018.8,
"valid_targets_min": 479
},
{
"epoch": 0.059084194977843424,
"grad_norm": 1.5356961908394742,
"learning_rate": 3.2911392405063294e-06,
"loss": 0.4411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3926240801811218,
"step": 40,
"valid_targets_mean": 4400.6,
"valid_targets_min": 517
},
{
"epoch": 0.06646971935007386,
"grad_norm": 1.0870293491792131,
"learning_rate": 3.713080168776372e-06,
"loss": 0.4433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.417349636554718,
"step": 45,
"valid_targets_mean": 5836.1,
"valid_targets_min": 762
},
{
"epoch": 0.07385524372230429,
"grad_norm": 0.943385047160246,
"learning_rate": 4.135021097046414e-06,
"loss": 0.4154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41143539547920227,
"step": 50,
"valid_targets_mean": 5084.6,
"valid_targets_min": 639
},
{
"epoch": 0.08124076809453472,
"grad_norm": 1.011998448398478,
"learning_rate": 4.556962025316456e-06,
"loss": 0.4151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39654070138931274,
"step": 55,
"valid_targets_mean": 5247.8,
"valid_targets_min": 681
},
{
"epoch": 0.08862629246676514,
"grad_norm": 0.686487046735958,
"learning_rate": 4.978902953586498e-06,
"loss": 0.3792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33487510681152344,
"step": 60,
"valid_targets_mean": 5221.6,
"valid_targets_min": 490
},
{
"epoch": 0.09601181683899557,
"grad_norm": 0.571553738713959,
"learning_rate": 5.40084388185654e-06,
"loss": 0.3743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3575626313686371,
"step": 65,
"valid_targets_mean": 6041.3,
"valid_targets_min": 618
},
{
"epoch": 0.103397341211226,
"grad_norm": 0.49365785429432335,
"learning_rate": 5.8227848101265824e-06,
"loss": 0.3463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30460304021835327,
"step": 70,
"valid_targets_mean": 5298.4,
"valid_targets_min": 535
},
{
"epoch": 0.11078286558345643,
"grad_norm": 0.5050364830057085,
"learning_rate": 6.244725738396625e-06,
"loss": 0.3399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3081740140914917,
"step": 75,
"valid_targets_mean": 5255.7,
"valid_targets_min": 652
},
{
"epoch": 0.11816838995568685,
"grad_norm": 0.5226990318037864,
"learning_rate": 6.666666666666667e-06,
"loss": 0.3904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3145563006401062,
"step": 80,
"valid_targets_mean": 4663.9,
"valid_targets_min": 392
},
{
"epoch": 0.1255539143279173,
"grad_norm": 0.4881100768231626,
"learning_rate": 7.08860759493671e-06,
"loss": 0.3726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30497312545776367,
"step": 85,
"valid_targets_mean": 5632.1,
"valid_targets_min": 719
},
{
"epoch": 0.1329394387001477,
"grad_norm": 0.5237726651638548,
"learning_rate": 7.510548523206752e-06,
"loss": 0.3544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3278190791606903,
"step": 90,
"valid_targets_mean": 6220.0,
"valid_targets_min": 751
},
{
"epoch": 0.14032496307237813,
"grad_norm": 0.4650280516019618,
"learning_rate": 7.932489451476793e-06,
"loss": 0.3182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28953981399536133,
"step": 95,
"valid_targets_mean": 5031.3,
"valid_targets_min": 642
},
{
"epoch": 0.14771048744460857,
"grad_norm": 0.46371951812182943,
"learning_rate": 8.354430379746837e-06,
"loss": 0.3099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33909645676612854,
"step": 100,
"valid_targets_mean": 6196.9,
"valid_targets_min": 545
},
{
"epoch": 0.155096011816839,
"grad_norm": 0.4568538569230339,
"learning_rate": 8.776371308016879e-06,
"loss": 0.3471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2957189679145813,
"step": 105,
"valid_targets_mean": 6063.0,
"valid_targets_min": 584
},
{
"epoch": 0.16248153618906944,
"grad_norm": 0.4578520750020651,
"learning_rate": 9.198312236286921e-06,
"loss": 0.3276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29967236518859863,
"step": 110,
"valid_targets_mean": 6171.0,
"valid_targets_min": 540
},
{
"epoch": 0.16986706056129985,
"grad_norm": 0.4955996123561873,
"learning_rate": 9.620253164556963e-06,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2830328941345215,
"step": 115,
"valid_targets_mean": 4840.9,
"valid_targets_min": 454
},
{
"epoch": 0.17725258493353027,
"grad_norm": 0.5471230185393541,
"learning_rate": 1.0042194092827005e-05,
"loss": 0.3219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36016958951950073,
"step": 120,
"valid_targets_mean": 4376.1,
"valid_targets_min": 605
},
{
"epoch": 0.18463810930576072,
"grad_norm": 0.5075473057243887,
"learning_rate": 1.0464135021097049e-05,
"loss": 0.3135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.314586877822876,
"step": 125,
"valid_targets_mean": 4974.8,
"valid_targets_min": 615
},
{
"epoch": 0.19202363367799113,
"grad_norm": 0.4679315871943788,
"learning_rate": 1.088607594936709e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27506357431411743,
"step": 130,
"valid_targets_mean": 5003.4,
"valid_targets_min": 309
},
{
"epoch": 0.19940915805022155,
"grad_norm": 0.5203002455514378,
"learning_rate": 1.1308016877637132e-05,
"loss": 0.3111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3530064821243286,
"step": 135,
"valid_targets_mean": 4744.3,
"valid_targets_min": 380
},
{
"epoch": 0.206794682422452,
"grad_norm": 0.508532245402902,
"learning_rate": 1.1729957805907175e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26319918036460876,
"step": 140,
"valid_targets_mean": 4969.9,
"valid_targets_min": 298
},
{
"epoch": 0.21418020679468242,
"grad_norm": 0.4977333684095323,
"learning_rate": 1.2151898734177216e-05,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.281037300825119,
"step": 145,
"valid_targets_mean": 4680.9,
"valid_targets_min": 553
},
{
"epoch": 0.22156573116691286,
"grad_norm": 0.5700488921766971,
"learning_rate": 1.2573839662447258e-05,
"loss": 0.3138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3317258059978485,
"step": 150,
"valid_targets_mean": 4780.8,
"valid_targets_min": 613
},
{
"epoch": 0.22895125553914328,
"grad_norm": 0.5049210471064856,
"learning_rate": 1.29957805907173e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31507956981658936,
"step": 155,
"valid_targets_mean": 4951.3,
"valid_targets_min": 648
},
{
"epoch": 0.2363367799113737,
"grad_norm": 0.48733685753987915,
"learning_rate": 1.3417721518987344e-05,
"loss": 0.3144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3532077670097351,
"step": 160,
"valid_targets_mean": 5704.9,
"valid_targets_min": 615
},
{
"epoch": 0.24372230428360414,
"grad_norm": 0.478477178779921,
"learning_rate": 1.3839662447257384e-05,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25617825984954834,
"step": 165,
"valid_targets_mean": 5201.0,
"valid_targets_min": 614
},
{
"epoch": 0.2511078286558346,
"grad_norm": 0.6185796972171613,
"learning_rate": 1.4261603375527426e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3018920421600342,
"step": 170,
"valid_targets_mean": 4082.6,
"valid_targets_min": 595
},
{
"epoch": 0.258493353028065,
"grad_norm": 0.5575122691401694,
"learning_rate": 1.468354430379747e-05,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911016345024109,
"step": 175,
"valid_targets_mean": 4299.9,
"valid_targets_min": 662
},
{
"epoch": 0.2658788774002954,
"grad_norm": 0.6276828580042122,
"learning_rate": 1.5105485232067512e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25065547227859497,
"step": 180,
"valid_targets_mean": 4217.5,
"valid_targets_min": 388
},
{
"epoch": 0.27326440177252587,
"grad_norm": 0.4696050024959157,
"learning_rate": 1.5527426160337554e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2493332028388977,
"step": 185,
"valid_targets_mean": 5711.5,
"valid_targets_min": 679
},
{
"epoch": 0.28064992614475626,
"grad_norm": 0.5623419824234117,
"learning_rate": 1.5949367088607598e-05,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27796900272369385,
"step": 190,
"valid_targets_mean": 4589.1,
"valid_targets_min": 592
},
{
"epoch": 0.2880354505169867,
"grad_norm": 0.45269545432048147,
"learning_rate": 1.637130801687764e-05,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23348630964756012,
"step": 195,
"valid_targets_mean": 6195.4,
"valid_targets_min": 1406
},
{
"epoch": 0.29542097488921715,
"grad_norm": 0.5800039153836231,
"learning_rate": 1.679324894514768e-05,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3133583664894104,
"step": 200,
"valid_targets_mean": 4379.1,
"valid_targets_min": 577
},
{
"epoch": 0.30280649926144754,
"grad_norm": 0.4475247352688734,
"learning_rate": 1.7215189873417723e-05,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2346859574317932,
"step": 205,
"valid_targets_mean": 5674.9,
"valid_targets_min": 516
},
{
"epoch": 0.310192023633678,
"grad_norm": 0.6043039588064852,
"learning_rate": 1.7637130801687767e-05,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2985689640045166,
"step": 210,
"valid_targets_mean": 3230.7,
"valid_targets_min": 451
},
{
"epoch": 0.3175775480059084,
"grad_norm": 0.46608512023497484,
"learning_rate": 1.8059071729957807e-05,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2667817175388336,
"step": 215,
"valid_targets_mean": 5615.9,
"valid_targets_min": 608
},
{
"epoch": 0.3249630723781389,
"grad_norm": 0.6393799102975143,
"learning_rate": 1.848101265822785e-05,
"loss": 0.2857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3485134243965149,
"step": 220,
"valid_targets_mean": 5232.9,
"valid_targets_min": 551
},
{
"epoch": 0.33234859675036926,
"grad_norm": 0.4985956967264833,
"learning_rate": 1.890295358649789e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22727638483047485,
"step": 225,
"valid_targets_mean": 5186.1,
"valid_targets_min": 557
},
{
"epoch": 0.3397341211225997,
"grad_norm": 0.698867408214604,
"learning_rate": 1.9324894514767935e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28445443511009216,
"step": 230,
"valid_targets_mean": 4395.3,
"valid_targets_min": 613
},
{
"epoch": 0.34711964549483015,
"grad_norm": 0.4699161647524185,
"learning_rate": 1.974683544303798e-05,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27419084310531616,
"step": 235,
"valid_targets_mean": 6050.6,
"valid_targets_min": 697
},
{
"epoch": 0.35450516986706054,
"grad_norm": 0.49712308816298567,
"learning_rate": 2.0168776371308016e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2411026805639267,
"step": 240,
"valid_targets_mean": 6215.0,
"valid_targets_min": 375
},
{
"epoch": 0.361890694239291,
"grad_norm": 0.4755998361435196,
"learning_rate": 2.0590717299578063e-05,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31807953119277954,
"step": 245,
"valid_targets_mean": 5977.3,
"valid_targets_min": 222
},
{
"epoch": 0.36927621861152143,
"grad_norm": 0.5522737703807714,
"learning_rate": 2.1012658227848103e-05,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2637110650539398,
"step": 250,
"valid_targets_mean": 4707.1,
"valid_targets_min": 424
},
{
"epoch": 0.3766617429837518,
"grad_norm": 0.5752807812899275,
"learning_rate": 2.1434599156118144e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.252408891916275,
"step": 255,
"valid_targets_mean": 4646.9,
"valid_targets_min": 620
},
{
"epoch": 0.38404726735598227,
"grad_norm": 0.4839304938690229,
"learning_rate": 2.1856540084388188e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.311644971370697,
"step": 260,
"valid_targets_mean": 6014.4,
"valid_targets_min": 320
},
{
"epoch": 0.3914327917282127,
"grad_norm": 0.3679428184390633,
"learning_rate": 2.2278481012658228e-05,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1715935468673706,
"step": 265,
"valid_targets_mean": 7149.1,
"valid_targets_min": 708
},
{
"epoch": 0.3988183161004431,
"grad_norm": 0.4388882366281187,
"learning_rate": 2.270042194092827e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21887677907943726,
"step": 270,
"valid_targets_mean": 5259.7,
"valid_targets_min": 462
},
{
"epoch": 0.40620384047267355,
"grad_norm": 0.45156140818813745,
"learning_rate": 2.3122362869198316e-05,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1979508399963379,
"step": 275,
"valid_targets_mean": 5245.2,
"valid_targets_min": 370
},
{
"epoch": 0.413589364844904,
"grad_norm": 0.5635183886045622,
"learning_rate": 2.3544303797468356e-05,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2971973419189453,
"step": 280,
"valid_targets_mean": 4294.6,
"valid_targets_min": 250
},
{
"epoch": 0.42097488921713444,
"grad_norm": 0.6003559911338966,
"learning_rate": 2.39662447257384e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27018484473228455,
"step": 285,
"valid_targets_mean": 4037.1,
"valid_targets_min": 530
},
{
"epoch": 0.42836041358936483,
"grad_norm": 0.519146451009721,
"learning_rate": 2.438818565400844e-05,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25247296690940857,
"step": 290,
"valid_targets_mean": 5198.4,
"valid_targets_min": 757
},
{
"epoch": 0.4357459379615953,
"grad_norm": 0.5295365016140835,
"learning_rate": 2.481012658227848e-05,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30645301938056946,
"step": 295,
"valid_targets_mean": 5075.9,
"valid_targets_min": 586
},
{
"epoch": 0.4431314623338257,
"grad_norm": 0.5064359925137679,
"learning_rate": 2.5232067510548524e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27146783471107483,
"step": 300,
"valid_targets_mean": 5670.0,
"valid_targets_min": 510
},
{
"epoch": 0.4505169867060561,
"grad_norm": 0.4807884411055291,
"learning_rate": 2.5654008438818568e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.245832160115242,
"step": 305,
"valid_targets_mean": 4988.6,
"valid_targets_min": 758
},
{
"epoch": 0.45790251107828656,
"grad_norm": 0.4874621524760727,
"learning_rate": 2.6075949367088612e-05,
"loss": 0.2355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22424304485321045,
"step": 310,
"valid_targets_mean": 4865.2,
"valid_targets_min": 690
},
{
"epoch": 0.465288035450517,
"grad_norm": 0.5241781469793773,
"learning_rate": 2.6497890295358652e-05,
"loss": 0.2674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2541046142578125,
"step": 315,
"valid_targets_mean": 4655.8,
"valid_targets_min": 303
},
{
"epoch": 0.4726735598227474,
"grad_norm": 0.6693714356739207,
"learning_rate": 2.6919831223628693e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3150583803653717,
"step": 320,
"valid_targets_mean": 3789.6,
"valid_targets_min": 323
},
{
"epoch": 0.48005908419497784,
"grad_norm": 0.4049583166705286,
"learning_rate": 2.7341772151898737e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19988644123077393,
"step": 325,
"valid_targets_mean": 6250.1,
"valid_targets_min": 565
},
{
"epoch": 0.4874446085672083,
"grad_norm": 0.5683986043691779,
"learning_rate": 2.7763713080168777e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30885380506515503,
"step": 330,
"valid_targets_mean": 4539.6,
"valid_targets_min": 511
},
{
"epoch": 0.4948301329394387,
"grad_norm": 0.4293798580209713,
"learning_rate": 2.8185654008438824e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2373587191104889,
"step": 335,
"valid_targets_mean": 6893.3,
"valid_targets_min": 540
},
{
"epoch": 0.5022156573116692,
"grad_norm": 0.5051385898465901,
"learning_rate": 2.8607594936708865e-05,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2349412590265274,
"step": 340,
"valid_targets_mean": 5513.8,
"valid_targets_min": 348
},
{
"epoch": 0.5096011816838996,
"grad_norm": 0.453650649705282,
"learning_rate": 2.9029535864978905e-05,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24615350365638733,
"step": 345,
"valid_targets_mean": 5636.8,
"valid_targets_min": 632
},
{
"epoch": 0.51698670605613,
"grad_norm": 0.5026094522177535,
"learning_rate": 2.945147679324895e-05,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25473105907440186,
"step": 350,
"valid_targets_mean": 4648.2,
"valid_targets_min": 618
},
{
"epoch": 0.5243722304283605,
"grad_norm": 0.5473929641026576,
"learning_rate": 2.987341772151899e-05,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25512436032295227,
"step": 355,
"valid_targets_mean": 4888.8,
"valid_targets_min": 455
},
{
"epoch": 0.5317577548005908,
"grad_norm": 0.6818407765763758,
"learning_rate": 3.029535864978903e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26583975553512573,
"step": 360,
"valid_targets_mean": 3901.6,
"valid_targets_min": 393
},
{
"epoch": 0.5391432791728212,
"grad_norm": 0.43264528877861325,
"learning_rate": 3.0717299578059074e-05,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2336602509021759,
"step": 365,
"valid_targets_mean": 6759.1,
"valid_targets_min": 654
},
{
"epoch": 0.5465288035450517,
"grad_norm": 0.4786744793085355,
"learning_rate": 3.113924050632912e-05,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23913979530334473,
"step": 370,
"valid_targets_mean": 5128.6,
"valid_targets_min": 436
},
{
"epoch": 0.5539143279172821,
"grad_norm": 0.6098930815067188,
"learning_rate": 3.156118143459916e-05,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27685385942459106,
"step": 375,
"valid_targets_mean": 4722.4,
"valid_targets_min": 547
},
{
"epoch": 0.5612998522895125,
"grad_norm": 0.4884326875060275,
"learning_rate": 3.19831223628692e-05,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.269244909286499,
"step": 380,
"valid_targets_mean": 5746.3,
"valid_targets_min": 649
},
{
"epoch": 0.568685376661743,
"grad_norm": 0.6966159287505779,
"learning_rate": 3.240506329113924e-05,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25672098994255066,
"step": 385,
"valid_targets_mean": 5211.0,
"valid_targets_min": 451
},
{
"epoch": 0.5760709010339734,
"grad_norm": 0.4826433803477916,
"learning_rate": 3.282700421940928e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21904008090496063,
"step": 390,
"valid_targets_mean": 4840.0,
"valid_targets_min": 614
},
{
"epoch": 0.5834564254062038,
"grad_norm": 0.5161328067549831,
"learning_rate": 3.324894514767932e-05,
"loss": 0.2401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21546295285224915,
"step": 395,
"valid_targets_mean": 5000.8,
"valid_targets_min": 474
},
{
"epoch": 0.5908419497784343,
"grad_norm": 0.441903839632028,
"learning_rate": 3.367088607594937e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2418462634086609,
"step": 400,
"valid_targets_mean": 6752.2,
"valid_targets_min": 526
},
{
"epoch": 0.5982274741506647,
"grad_norm": 0.4263460620059315,
"learning_rate": 3.409282700421941e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2564152479171753,
"step": 405,
"valid_targets_mean": 5806.5,
"valid_targets_min": 581
},
{
"epoch": 0.6056129985228951,
"grad_norm": 0.4114391570850889,
"learning_rate": 3.451476793248946e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19688798487186432,
"step": 410,
"valid_targets_mean": 5193.4,
"valid_targets_min": 765
},
{
"epoch": 0.6129985228951256,
"grad_norm": 0.560472208109208,
"learning_rate": 3.49367088607595e-05,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3748968243598938,
"step": 415,
"valid_targets_mean": 6106.8,
"valid_targets_min": 673
},
{
"epoch": 0.620384047267356,
"grad_norm": 0.4389773616307953,
"learning_rate": 3.535864978902954e-05,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25939327478408813,
"step": 420,
"valid_targets_mean": 5600.4,
"valid_targets_min": 587
},
{
"epoch": 0.6277695716395865,
"grad_norm": 0.49005945851489136,
"learning_rate": 3.578059071729958e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2415715903043747,
"step": 425,
"valid_targets_mean": 5480.6,
"valid_targets_min": 557
},
{
"epoch": 0.6351550960118169,
"grad_norm": 0.6120232650144795,
"learning_rate": 3.6202531645569626e-05,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27258408069610596,
"step": 430,
"valid_targets_mean": 4020.8,
"valid_targets_min": 575
},
{
"epoch": 0.6425406203840472,
"grad_norm": 0.5517761299010163,
"learning_rate": 3.6624472573839666e-05,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2571716904640198,
"step": 435,
"valid_targets_mean": 3986.9,
"valid_targets_min": 570
},
{
"epoch": 0.6499261447562777,
"grad_norm": 0.4519259500134533,
"learning_rate": 3.704641350210971e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23544706404209137,
"step": 440,
"valid_targets_mean": 5446.1,
"valid_targets_min": 798
},
{
"epoch": 0.6573116691285081,
"grad_norm": 0.4627225505498187,
"learning_rate": 3.746835443037975e-05,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22768300771713257,
"step": 445,
"valid_targets_mean": 5305.9,
"valid_targets_min": 612
},
{
"epoch": 0.6646971935007385,
"grad_norm": 0.5459862764397345,
"learning_rate": 3.7890295358649794e-05,
"loss": 0.2509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2680595815181732,
"step": 450,
"valid_targets_mean": 3753.4,
"valid_targets_min": 637
},
{
"epoch": 0.672082717872969,
"grad_norm": 0.5037347511570361,
"learning_rate": 3.8312236286919835e-05,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2467479407787323,
"step": 455,
"valid_targets_mean": 5501.6,
"valid_targets_min": 310
},
{
"epoch": 0.6794682422451994,
"grad_norm": 0.4327775289602796,
"learning_rate": 3.873417721518988e-05,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19664692878723145,
"step": 460,
"valid_targets_mean": 5931.2,
"valid_targets_min": 913
},
{
"epoch": 0.6868537666174298,
"grad_norm": 0.4409637060996679,
"learning_rate": 3.915611814345992e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21506735682487488,
"step": 465,
"valid_targets_mean": 6059.1,
"valid_targets_min": 647
},
{
"epoch": 0.6942392909896603,
"grad_norm": 0.5504576504647792,
"learning_rate": 3.957805907172996e-05,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2300184667110443,
"step": 470,
"valid_targets_mean": 3839.0,
"valid_targets_min": 557
},
{
"epoch": 0.7016248153618907,
"grad_norm": 0.429274562141855,
"learning_rate": 4e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2237507700920105,
"step": 475,
"valid_targets_mean": 6357.5,
"valid_targets_min": 742
},
{
"epoch": 0.7090103397341211,
"grad_norm": 0.7536006693457217,
"learning_rate": 3.9999864355811366e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22905516624450684,
"step": 480,
"valid_targets_mean": 4381.5,
"valid_targets_min": 729
},
{
"epoch": 0.7163958641063516,
"grad_norm": 0.43953758941215776,
"learning_rate": 3.99994574250854e-05,
"loss": 0.2316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20200951397418976,
"step": 485,
"valid_targets_mean": 5644.1,
"valid_targets_min": 683
},
{
"epoch": 0.723781388478582,
"grad_norm": 0.4723664561759756,
"learning_rate": 3.999877921334187e-05,
"loss": 0.2475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26116621494293213,
"step": 490,
"valid_targets_mean": 5649.9,
"valid_targets_min": 598
},
{
"epoch": 0.7311669128508124,
"grad_norm": 0.5372942073144541,
"learning_rate": 3.999782972978035e-05,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2597278356552124,
"step": 495,
"valid_targets_mean": 4376.8,
"valid_targets_min": 711
},
{
"epoch": 0.7385524372230429,
"grad_norm": 0.4923885109877066,
"learning_rate": 3.9996608987280005e-05,
"loss": 0.2537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3310204744338989,
"step": 500,
"valid_targets_mean": 5373.9,
"valid_targets_min": 362
},
{
"epoch": 0.7459379615952733,
"grad_norm": 0.4360411302968856,
"learning_rate": 3.999511700239951e-05,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23595163226127625,
"step": 505,
"valid_targets_mean": 5867.7,
"valid_targets_min": 747
},
{
"epoch": 0.7533234859675036,
"grad_norm": 0.4125019822494474,
"learning_rate": 3.999335379537677e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22982177138328552,
"step": 510,
"valid_targets_mean": 5860.2,
"valid_targets_min": 284
},
{
"epoch": 0.7607090103397341,
"grad_norm": 0.4816111850196653,
"learning_rate": 3.999131939012866e-05,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23170827329158783,
"step": 515,
"valid_targets_mean": 5939.9,
"valid_targets_min": 573
},
{
"epoch": 0.7680945347119645,
"grad_norm": 0.5607421617686298,
"learning_rate": 3.998901381425072e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27282047271728516,
"step": 520,
"valid_targets_mean": 4010.6,
"valid_targets_min": 308
},
{
"epoch": 0.7754800590841949,
"grad_norm": 0.4899434940882494,
"learning_rate": 3.998643709901673e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2315795123577118,
"step": 525,
"valid_targets_mean": 4446.6,
"valid_targets_min": 755
},
{
"epoch": 0.7828655834564254,
"grad_norm": 0.4551383882144779,
"learning_rate": 3.998358927937835e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21953409910202026,
"step": 530,
"valid_targets_mean": 5531.2,
"valid_targets_min": 538
},
{
"epoch": 0.7902511078286558,
"grad_norm": 0.4743224847774692,
"learning_rate": 3.9980470393964584e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23994377255439758,
"step": 535,
"valid_targets_mean": 4992.5,
"valid_targets_min": 499
},
{
"epoch": 0.7976366322008862,
"grad_norm": 0.42125006599133685,
"learning_rate": 3.997708048508131e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19587251543998718,
"step": 540,
"valid_targets_mean": 5289.6,
"valid_targets_min": 667
},
{
"epoch": 0.8050221565731167,
"grad_norm": 0.524726561877271,
"learning_rate": 3.997341959871066e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21869216859340668,
"step": 545,
"valid_targets_mean": 4091.0,
"valid_targets_min": 641
},
{
"epoch": 0.8124076809453471,
"grad_norm": 1.0978518384034786,
"learning_rate": 3.996948778451044e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2922288179397583,
"step": 550,
"valid_targets_mean": 4755.1,
"valid_targets_min": 683
},
{
"epoch": 0.8197932053175776,
"grad_norm": 0.434588106606303,
"learning_rate": 3.996528509581343e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2291834056377411,
"step": 555,
"valid_targets_mean": 6349.8,
"valid_targets_min": 911
},
{
"epoch": 0.827178729689808,
"grad_norm": 0.44781488594353586,
"learning_rate": 3.996081158962664e-05,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21667613089084625,
"step": 560,
"valid_targets_mean": 5273.2,
"valid_targets_min": 510
},
{
"epoch": 0.8345642540620384,
"grad_norm": 0.4232290679425604,
"learning_rate": 3.995606732663061e-05,
"loss": 0.2432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21859529614448547,
"step": 565,
"valid_targets_mean": 6958.2,
"valid_targets_min": 578
},
{
"epoch": 0.8419497784342689,
"grad_norm": 0.37603814378739714,
"learning_rate": 3.9951052371178484e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20742715895175934,
"step": 570,
"valid_targets_mean": 6439.2,
"valid_targets_min": 948
},
{
"epoch": 0.8493353028064993,
"grad_norm": 0.5330316503851572,
"learning_rate": 3.994576679129523e-05,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27818042039871216,
"step": 575,
"valid_targets_mean": 4627.2,
"valid_targets_min": 603
},
{
"epoch": 0.8567208271787297,
"grad_norm": 0.48524432401103307,
"learning_rate": 3.9940210658676674e-05,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2559252977371216,
"step": 580,
"valid_targets_mean": 4795.9,
"valid_targets_min": 476
},
{
"epoch": 0.8641063515509602,
"grad_norm": 0.49687821950248273,
"learning_rate": 3.993438404868851e-05,
"loss": 0.2306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22851648926734924,
"step": 585,
"valid_targets_mean": 5150.0,
"valid_targets_min": 523
},
{
"epoch": 0.8714918759231906,
"grad_norm": 0.4956097153548755,
"learning_rate": 3.9928287040365334e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29340338706970215,
"step": 590,
"valid_targets_mean": 4955.4,
"valid_targets_min": 602
},
{
"epoch": 0.8788774002954209,
"grad_norm": 0.47621975231571884,
"learning_rate": 3.992191971640951e-05,
"loss": 0.2342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27463576197624207,
"step": 595,
"valid_targets_mean": 5440.9,
"valid_targets_min": 602
},
{
"epoch": 0.8862629246676514,
"grad_norm": 0.4864192134736827,
"learning_rate": 3.9915282163190084e-05,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.202743798494339,
"step": 600,
"valid_targets_mean": 4574.8,
"valid_targets_min": 529
},
{
"epoch": 0.8936484490398818,
"grad_norm": 0.4436441374970087,
"learning_rate": 3.990837447074162e-05,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2884596586227417,
"step": 605,
"valid_targets_mean": 5406.1,
"valid_targets_min": 654
},
{
"epoch": 0.9010339734121122,
"grad_norm": 0.5091014640879844,
"learning_rate": 3.990119673276294e-05,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2561118006706238,
"step": 610,
"valid_targets_mean": 3856.2,
"valid_targets_min": 395
},
{
"epoch": 0.9084194977843427,
"grad_norm": 0.44293254378519337,
"learning_rate": 3.989374904661589e-05,
"loss": 0.2338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2175714075565338,
"step": 615,
"valid_targets_mean": 5307.1,
"valid_targets_min": 654
},
{
"epoch": 0.9158050221565731,
"grad_norm": 0.4969299448859931,
"learning_rate": 3.988603151332402e-05,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23327939212322235,
"step": 620,
"valid_targets_mean": 4357.9,
"valid_targets_min": 932
},
{
"epoch": 0.9231905465288035,
"grad_norm": 0.399043646975211,
"learning_rate": 3.987804423757116e-05,
"loss": 0.2444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2003873586654663,
"step": 625,
"valid_targets_mean": 6620.2,
"valid_targets_min": 717
},
{
"epoch": 0.930576070901034,
"grad_norm": 0.5569804334944528,
"learning_rate": 3.986978732770008e-05,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25180336833000183,
"step": 630,
"valid_targets_mean": 5835.9,
"valid_targets_min": 632
},
{
"epoch": 0.9379615952732644,
"grad_norm": 0.65226776693925,
"learning_rate": 3.986126089571096e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25059741735458374,
"step": 635,
"valid_targets_mean": 4920.8,
"valid_targets_min": 558
},
{
"epoch": 0.9453471196454948,
"grad_norm": 0.7108324020329172,
"learning_rate": 3.98524650572599e-05,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2292698323726654,
"step": 640,
"valid_targets_mean": 6018.6,
"valid_targets_min": 596
},
{
"epoch": 0.9527326440177253,
"grad_norm": 0.6100872297295562,
"learning_rate": 3.984339993165733e-05,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2530120611190796,
"step": 645,
"valid_targets_mean": 4852.8,
"valid_targets_min": 491
},
{
"epoch": 0.9601181683899557,
"grad_norm": 0.6894230566439239,
"learning_rate": 3.9834065641866405e-05,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2521514594554901,
"step": 650,
"valid_targets_mean": 4665.9,
"valid_targets_min": 651
},
{
"epoch": 0.9675036927621861,
"grad_norm": 0.6477076251824874,
"learning_rate": 3.9824462314501355e-05,
"loss": 0.2148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21362358331680298,
"step": 655,
"valid_targets_mean": 5620.9,
"valid_targets_min": 775
},
{
"epoch": 0.9748892171344166,
"grad_norm": 0.4865282373044303,
"learning_rate": 3.981459007982573e-05,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22964204847812653,
"step": 660,
"valid_targets_mean": 4150.7,
"valid_targets_min": 476
},
{
"epoch": 0.982274741506647,
"grad_norm": 0.4265759209620169,
"learning_rate": 3.980444907175065e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23872928321361542,
"step": 665,
"valid_targets_mean": 4645.1,
"valid_targets_min": 490
},
{
"epoch": 0.9896602658788775,
"grad_norm": 0.4337931141291071,
"learning_rate": 3.979403942783301e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21394482254981995,
"step": 670,
"valid_targets_mean": 5586.5,
"valid_targets_min": 583
},
{
"epoch": 0.9970457902511078,
"grad_norm": 0.44216457771241374,
"learning_rate": 3.9783361289273565e-05,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2214493751525879,
"step": 675,
"valid_targets_mean": 5189.8,
"valid_targets_min": 490
},
{
"epoch": 1.0044313146233383,
"grad_norm": 0.4033533200689087,
"learning_rate": 3.977241480091507e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21175044775009155,
"step": 680,
"valid_targets_mean": 6346.5,
"valid_targets_min": 2699
},
{
"epoch": 1.0118168389955686,
"grad_norm": 0.485561570780159,
"learning_rate": 3.976120011124027e-05,
"loss": 0.2282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2394808530807495,
"step": 685,
"valid_targets_mean": 5191.0,
"valid_targets_min": 764
},
{
"epoch": 1.0192023633677991,
"grad_norm": 0.4391190385256597,
"learning_rate": 3.974971737236992e-05,
"loss": 0.217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23937949538230896,
"step": 690,
"valid_targets_mean": 5908.1,
"valid_targets_min": 742
},
{
"epoch": 1.0265878877400296,
"grad_norm": 0.44514329511208256,
"learning_rate": 3.9737966740060694e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20545028150081635,
"step": 695,
"valid_targets_mean": 4889.1,
"valid_targets_min": 246
},
{
"epoch": 1.03397341211226,
"grad_norm": 0.5296228485775536,
"learning_rate": 3.97259483737031e-05,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25395631790161133,
"step": 700,
"valid_targets_mean": 5731.1,
"valid_targets_min": 556
},
{
"epoch": 1.0413589364844904,
"grad_norm": 0.4073116341963712,
"learning_rate": 3.9713662436319283e-05,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.234715536236763,
"step": 705,
"valid_targets_mean": 5917.2,
"valid_targets_min": 781
},
{
"epoch": 1.048744460856721,
"grad_norm": 0.4815030594150368,
"learning_rate": 3.9701109094560844e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2784745395183563,
"step": 710,
"valid_targets_mean": 4806.1,
"valid_targets_min": 559
},
{
"epoch": 1.0561299852289512,
"grad_norm": 0.49302209706755173,
"learning_rate": 3.9688288518706576e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2195298820734024,
"step": 715,
"valid_targets_mean": 4878.7,
"valid_targets_min": 652
},
{
"epoch": 1.0635155096011817,
"grad_norm": 0.5556432641590098,
"learning_rate": 3.967520088266014e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3123176097869873,
"step": 720,
"valid_targets_mean": 4661.2,
"valid_targets_min": 459
},
{
"epoch": 1.0709010339734122,
"grad_norm": 0.4534308645642078,
"learning_rate": 3.96618463639477e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2006494402885437,
"step": 725,
"valid_targets_mean": 4573.6,
"valid_targets_min": 623
},
{
"epoch": 1.0782865583456425,
"grad_norm": 0.47188855620624076,
"learning_rate": 3.9648225143715565e-05,
"loss": 0.2215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2375321090221405,
"step": 730,
"valid_targets_mean": 5050.3,
"valid_targets_min": 697
},
{
"epoch": 1.085672082717873,
"grad_norm": 0.5815500233739369,
"learning_rate": 3.9634337406727646e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2476039081811905,
"step": 735,
"valid_targets_mean": 4952.1,
"valid_targets_min": 620
},
{
"epoch": 1.0930576070901035,
"grad_norm": 0.44455506894558233,
"learning_rate": 3.962018334136304e-05,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2000984251499176,
"step": 740,
"valid_targets_mean": 5665.1,
"valid_targets_min": 564
},
{
"epoch": 1.1004431314623337,
"grad_norm": 0.41891782048261406,
"learning_rate": 3.960576313961342e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20635861158370972,
"step": 745,
"valid_targets_mean": 5981.8,
"valid_targets_min": 553
},
{
"epoch": 1.1078286558345642,
"grad_norm": 0.43106390225148533,
"learning_rate": 3.9591076997080425e-05,
"loss": 0.2206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23344707489013672,
"step": 750,
"valid_targets_mean": 5677.6,
"valid_targets_min": 682
},
{
"epoch": 1.1152141802067947,
"grad_norm": 0.41866856940372654,
"learning_rate": 3.9576125112973064e-05,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2010667622089386,
"step": 755,
"valid_targets_mean": 5764.6,
"valid_targets_min": 755
},
{
"epoch": 1.122599704579025,
"grad_norm": 0.3898308822960811,
"learning_rate": 3.956090769010495e-05,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21998938918113708,
"step": 760,
"valid_targets_mean": 7065.8,
"valid_targets_min": 606
},
{
"epoch": 1.1299852289512555,
"grad_norm": 0.4317215373352644,
"learning_rate": 3.954542493489158e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23063355684280396,
"step": 765,
"valid_targets_mean": 6418.8,
"valid_targets_min": 710
},
{
"epoch": 1.137370753323486,
"grad_norm": 0.4412576392418719,
"learning_rate": 3.952967705734752e-05,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20747151970863342,
"step": 770,
"valid_targets_mean": 5115.1,
"valid_targets_min": 600
},
{
"epoch": 1.1447562776957163,
"grad_norm": 0.5452994774328421,
"learning_rate": 3.951366427108359e-05,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2622203826904297,
"step": 775,
"valid_targets_mean": 3728.9,
"valid_targets_min": 762
},
{
"epoch": 1.1521418020679468,
"grad_norm": 0.4161239474977219,
"learning_rate": 3.9497386793303934e-05,
"loss": 0.2184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23140665888786316,
"step": 780,
"valid_targets_mean": 6516.1,
"valid_targets_min": 521
},
{
"epoch": 1.1595273264401773,
"grad_norm": 0.4996982771781497,
"learning_rate": 3.9480844844803065e-05,
"loss": 0.2289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21708938479423523,
"step": 785,
"valid_targets_mean": 4092.6,
"valid_targets_min": 491
},
{
"epoch": 1.1669128508124076,
"grad_norm": 0.43107207086038685,
"learning_rate": 3.946403864996291e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19202640652656555,
"step": 790,
"valid_targets_mean": 5623.8,
"valid_targets_min": 567
},
{
"epoch": 1.174298375184638,
"grad_norm": 0.6020812405004927,
"learning_rate": 3.944696843674973e-05,
"loss": 0.2265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.267403244972229,
"step": 795,
"valid_targets_mean": 3391.2,
"valid_targets_min": 617
},
{
"epoch": 1.1816838995568686,
"grad_norm": 0.4663676848971227,
"learning_rate": 3.942963443671105e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2613796889781952,
"step": 800,
"valid_targets_mean": 5378.3,
"valid_targets_min": 552
},
{
"epoch": 1.1890694239290989,
"grad_norm": 0.4485332389236638,
"learning_rate": 3.9412036884972515e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2017560601234436,
"step": 805,
"valid_targets_mean": 4622.5,
"valid_targets_min": 531
},
{
"epoch": 1.1964549483013294,
"grad_norm": 0.47317157878156907,
"learning_rate": 3.939417602023467e-05,
"loss": 0.2169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2027883231639862,
"step": 810,
"valid_targets_mean": 4890.3,
"valid_targets_min": 638
},
{
"epoch": 1.2038404726735599,
"grad_norm": 0.5193762458310359,
"learning_rate": 3.937605208476979e-05,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23114809393882751,
"step": 815,
"valid_targets_mean": 4104.7,
"valid_targets_min": 659
},
{
"epoch": 1.2112259970457901,
"grad_norm": 0.5116940935110126,
"learning_rate": 3.93576653244185e-05,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3086828291416168,
"step": 820,
"valid_targets_mean": 5347.4,
"valid_targets_min": 692
},
{
"epoch": 1.2186115214180206,
"grad_norm": 0.6948645135111495,
"learning_rate": 3.933901598858653e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23770800232887268,
"step": 825,
"valid_targets_mean": 4581.4,
"valid_targets_min": 575
},
{
"epoch": 1.2259970457902511,
"grad_norm": 0.3666222705529873,
"learning_rate": 3.9320104330241294e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20173095166683197,
"step": 830,
"valid_targets_mean": 7597.5,
"valid_targets_min": 563
},
{
"epoch": 1.2333825701624814,
"grad_norm": 0.4553744544104897,
"learning_rate": 3.9300930605908434e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2501322031021118,
"step": 835,
"valid_targets_mean": 5175.3,
"valid_targets_min": 477
},
{
"epoch": 1.240768094534712,
"grad_norm": 0.4074174770824338,
"learning_rate": 3.928149507566838e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21756581962108612,
"step": 840,
"valid_targets_mean": 5838.4,
"valid_targets_min": 709
},
{
"epoch": 1.2481536189069424,
"grad_norm": 0.3903886869594378,
"learning_rate": 3.926179800315281e-05,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19205650687217712,
"step": 845,
"valid_targets_mean": 5413.8,
"valid_targets_min": 497
},
{
"epoch": 1.2555391432791727,
"grad_norm": 0.48872055489952576,
"learning_rate": 3.924183965554106e-05,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2304544299840927,
"step": 850,
"valid_targets_mean": 5223.9,
"valid_targets_min": 362
},
{
"epoch": 1.2629246676514032,
"grad_norm": 0.5971024562814735,
"learning_rate": 3.9221620303556515e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1931340992450714,
"step": 855,
"valid_targets_mean": 6235.6,
"valid_targets_min": 698
},
{
"epoch": 1.2703101920236337,
"grad_norm": 0.441865132454004,
"learning_rate": 3.9201140221462947e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19833971560001373,
"step": 860,
"valid_targets_mean": 4980.0,
"valid_targets_min": 229
},
{
"epoch": 1.277695716395864,
"grad_norm": 0.448378137812601,
"learning_rate": 3.918039968706076e-05,
"loss": 0.2303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2166500836610794,
"step": 865,
"valid_targets_mean": 4924.2,
"valid_targets_min": 586
},
{
"epoch": 1.2850812407680945,
"grad_norm": 0.38685678373728877,
"learning_rate": 3.9159398981683245e-05,
"loss": 0.2115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17539414763450623,
"step": 870,
"valid_targets_mean": 6035.1,
"valid_targets_min": 928
},
{
"epoch": 1.292466765140325,
"grad_norm": 0.4163449238539416,
"learning_rate": 3.9138138390192776e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2028162181377411,
"step": 875,
"valid_targets_mean": 5722.0,
"valid_targets_min": 752
},
{
"epoch": 1.2998522895125553,
"grad_norm": 0.5685979494164379,
"learning_rate": 3.911661820097691e-05,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27309101819992065,
"step": 880,
"valid_targets_mean": 3300.4,
"valid_targets_min": 311
},
{
"epoch": 1.3072378138847858,
"grad_norm": 0.4369045779107333,
"learning_rate": 3.909483870594452e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2015451192855835,
"step": 885,
"valid_targets_mean": 5269.7,
"valid_targets_min": 571
},
{
"epoch": 1.3146233382570163,
"grad_norm": 0.4193133405997814,
"learning_rate": 3.9072800200521785e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21048672497272491,
"step": 890,
"valid_targets_mean": 5464.1,
"valid_targets_min": 748
},
{
"epoch": 1.3220088626292466,
"grad_norm": 0.388531558281405,
"learning_rate": 3.905050298364824e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16509976983070374,
"step": 895,
"valid_targets_mean": 5191.9,
"valid_targets_min": 517
},
{
"epoch": 1.329394387001477,
"grad_norm": 0.47820157235033706,
"learning_rate": 3.9027947357772664e-05,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2072378247976303,
"step": 900,
"valid_targets_mean": 4629.8,
"valid_targets_min": 702
},
{
"epoch": 1.3367799113737076,
"grad_norm": 0.4354737992607275,
"learning_rate": 3.900513362884901e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20593631267547607,
"step": 905,
"valid_targets_mean": 4609.3,
"valid_targets_min": 531
},
{
"epoch": 1.3441654357459378,
"grad_norm": 0.49663576162369527,
"learning_rate": 3.8982062106332264e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23853272199630737,
"step": 910,
"valid_targets_mean": 3835.1,
"valid_targets_min": 564
},
{
"epoch": 1.3515509601181683,
"grad_norm": 0.46267728260164404,
"learning_rate": 3.895873310317422e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20141030848026276,
"step": 915,
"valid_targets_mean": 4257.8,
"valid_targets_min": 807
},
{
"epoch": 1.3589364844903988,
"grad_norm": 0.4318042167691161,
"learning_rate": 3.893514693581924e-05,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23438894748687744,
"step": 920,
"valid_targets_mean": 5685.5,
"valid_targets_min": 637
},
{
"epoch": 1.3663220088626291,
"grad_norm": 0.46703807691935706,
"learning_rate": 3.8911303924199976e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22170604765415192,
"step": 925,
"valid_targets_mean": 4579.6,
"valid_targets_min": 648
},
{
"epoch": 1.3737075332348596,
"grad_norm": 0.49253435998552936,
"learning_rate": 3.888720439173304e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18895632028579712,
"step": 930,
"valid_targets_mean": 5223.1,
"valid_targets_min": 874
},
{
"epoch": 1.3810930576070901,
"grad_norm": 0.37295680843818396,
"learning_rate": 3.886284866531457e-05,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23819585144519806,
"step": 935,
"valid_targets_mean": 7344.1,
"valid_targets_min": 516
},
{
"epoch": 1.3884785819793206,
"grad_norm": 0.45860088434234825,
"learning_rate": 3.883823707531585e-05,
"loss": 0.2207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20355328917503357,
"step": 940,
"valid_targets_mean": 4777.0,
"valid_targets_min": 822
},
{
"epoch": 1.395864106351551,
"grad_norm": 0.4813637468871037,
"learning_rate": 3.8813369955578795e-05,
"loss": 0.2443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24247971177101135,
"step": 945,
"valid_targets_mean": 4676.9,
"valid_targets_min": 461
},
{
"epoch": 1.4032496307237814,
"grad_norm": 0.44965533755939013,
"learning_rate": 3.878824764341143e-05,
"loss": 0.2358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2948012351989746,
"step": 950,
"valid_targets_mean": 6391.8,
"valid_targets_min": 665
},
{
"epoch": 1.410635155096012,
"grad_norm": 0.4957030075557271,
"learning_rate": 3.876287047958331e-05,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2564036250114441,
"step": 955,
"valid_targets_mean": 4930.7,
"valid_targets_min": 709
},
{
"epoch": 1.4180206794682422,
"grad_norm": 0.4689797114164809,
"learning_rate": 3.8737238808320936e-05,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23838871717453003,
"step": 960,
"valid_targets_mean": 4520.2,
"valid_targets_min": 581
},
{
"epoch": 1.4254062038404727,
"grad_norm": 0.45226562564371103,
"learning_rate": 3.8711352977303015e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19582833349704742,
"step": 965,
"valid_targets_mean": 4792.9,
"valid_targets_min": 336
},
{
"epoch": 1.4327917282127032,
"grad_norm": 0.4499057955750725,
"learning_rate": 3.868521333765581e-05,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21399438381195068,
"step": 970,
"valid_targets_mean": 5207.8,
"valid_targets_min": 535
},
{
"epoch": 1.4401772525849335,
"grad_norm": 0.3550283452289212,
"learning_rate": 3.865882024394834e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17050230503082275,
"step": 975,
"valid_targets_mean": 6535.8,
"valid_targets_min": 578
},
{
"epoch": 1.447562776957164,
"grad_norm": 0.3851306477864997,
"learning_rate": 3.863217405418759e-05,
"loss": 0.216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.205580934882164,
"step": 980,
"valid_targets_mean": 5663.9,
"valid_targets_min": 868
},
{
"epoch": 1.4549483013293945,
"grad_norm": 0.5896596645032985,
"learning_rate": 3.8605275129813626e-05,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21005357801914215,
"step": 985,
"valid_targets_mean": 4708.6,
"valid_targets_min": 768
},
{
"epoch": 1.4623338257016247,
"grad_norm": 0.48610764474272555,
"learning_rate": 3.857812383569473e-05,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22247350215911865,
"step": 990,
"valid_targets_mean": 5245.6,
"valid_targets_min": 643
},
{
"epoch": 1.4697193500738552,
"grad_norm": 0.4265714039395906,
"learning_rate": 3.8550720540122436e-05,
"loss": 0.2177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2506152391433716,
"step": 995,
"valid_targets_mean": 5852.4,
"valid_targets_min": 679
},
{
"epoch": 1.4771048744460857,
"grad_norm": 0.418243711485139,
"learning_rate": 3.852306561480652e-05,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25498437881469727,
"step": 1000,
"valid_targets_mean": 6060.9,
"valid_targets_min": 585
},
{
"epoch": 1.4844903988183162,
"grad_norm": 0.5725357827213264,
"learning_rate": 3.8495159434869966e-05,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.222720205783844,
"step": 1005,
"valid_targets_mean": 5578.1,
"valid_targets_min": 424
},
{
"epoch": 1.4918759231905465,
"grad_norm": 0.7420773277261102,
"learning_rate": 3.846700237884389e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2858394980430603,
"step": 1010,
"valid_targets_mean": 3759.1,
"valid_targets_min": 407
},
{
"epoch": 1.499261447562777,
"grad_norm": 0.4640644425487349,
"learning_rate": 3.84385948286624e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21131858229637146,
"step": 1015,
"valid_targets_mean": 4703.7,
"valid_targets_min": 460
},
{
"epoch": 1.5066469719350075,
"grad_norm": 0.47403611928498096,
"learning_rate": 3.8409937169657393e-05,
"loss": 0.2401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2791014313697815,
"step": 1020,
"valid_targets_mean": 5770.7,
"valid_targets_min": 572
},
{
"epoch": 1.5140324963072378,
"grad_norm": 0.3527301227310117,
"learning_rate": 3.8381029790553376e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21376456320285797,
"step": 1025,
"valid_targets_mean": 7688.9,
"valid_targets_min": 1061
},
{
"epoch": 1.5214180206794683,
"grad_norm": 0.48244790889065403,
"learning_rate": 3.8351873083462135e-05,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22939425706863403,
"step": 1030,
"valid_targets_mean": 3952.4,
"valid_targets_min": 614
},
{
"epoch": 1.5288035450516988,
"grad_norm": 0.4441322237358841,
"learning_rate": 3.832246744387746e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19595670700073242,
"step": 1035,
"valid_targets_mean": 5734.9,
"valid_targets_min": 602
},
{
"epoch": 1.536189069423929,
"grad_norm": 0.42687842371627116,
"learning_rate": 3.829281327066977e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2039499282836914,
"step": 1040,
"valid_targets_mean": 5575.5,
"valid_targets_min": 567
},
{
"epoch": 1.5435745937961596,
"grad_norm": 0.4616898715899763,
"learning_rate": 3.826291096608068e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24281984567642212,
"step": 1045,
"valid_targets_mean": 4569.6,
"valid_targets_min": 566
},
{
"epoch": 1.55096011816839,
"grad_norm": 0.516188071513123,
"learning_rate": 3.823276093571758e-05,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23861096799373627,
"step": 1050,
"valid_targets_mean": 5593.9,
"valid_targets_min": 756
},
{
"epoch": 1.5583456425406204,
"grad_norm": 0.4323810628023057,
"learning_rate": 3.820236358854812e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18166664242744446,
"step": 1055,
"valid_targets_mean": 5191.4,
"valid_targets_min": 548
},
{
"epoch": 1.5657311669128509,
"grad_norm": 0.41249483128752723,
"learning_rate": 3.817171933689464e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21327346563339233,
"step": 1060,
"valid_targets_mean": 6157.4,
"valid_targets_min": 587
},
{
"epoch": 1.5731166912850814,
"grad_norm": 0.4280649794546595,
"learning_rate": 3.81408285964286e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2045423984527588,
"step": 1065,
"valid_targets_mean": 5231.2,
"valid_targets_min": 583
},
{
"epoch": 1.5805022156573116,
"grad_norm": 0.3567235937466317,
"learning_rate": 3.810969178616495e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1872180700302124,
"step": 1070,
"valid_targets_mean": 6435.2,
"valid_targets_min": 828
},
{
"epoch": 1.5878877400295421,
"grad_norm": 0.3967044287073082,
"learning_rate": 3.807830932845643e-05,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21867504715919495,
"step": 1075,
"valid_targets_mean": 5695.5,
"valid_targets_min": 370
},
{
"epoch": 1.5952732644017726,
"grad_norm": 0.4258406051484541,
"learning_rate": 3.8046681648987826e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21099427342414856,
"step": 1080,
"valid_targets_mean": 5131.6,
"valid_targets_min": 578
},
{
"epoch": 1.602658788774003,
"grad_norm": 0.4734317720239788,
"learning_rate": 3.801480917677025e-05,
"loss": 0.2409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20774179697036743,
"step": 1085,
"valid_targets_mean": 3967.3,
"valid_targets_min": 535
},
{
"epoch": 1.6100443131462334,
"grad_norm": 0.44845704175379064,
"learning_rate": 3.798269234413525e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22882190346717834,
"step": 1090,
"valid_targets_mean": 4234.2,
"valid_targets_min": 453
},
{
"epoch": 1.617429837518464,
"grad_norm": 0.43870094592908176,
"learning_rate": 3.795033158672901e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20205071568489075,
"step": 1095,
"valid_targets_mean": 4710.2,
"valid_targets_min": 390
},
{
"epoch": 1.6248153618906942,
"grad_norm": 0.46114331054142615,
"learning_rate": 3.7917727343506384e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2182081788778305,
"step": 1100,
"valid_targets_mean": 4210.6,
"valid_targets_min": 630
},
{
"epoch": 1.6322008862629247,
"grad_norm": 0.46898057951501565,
"learning_rate": 3.788488005672499e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18588444590568542,
"step": 1105,
"valid_targets_mean": 5456.4,
"valid_targets_min": 697
},
{
"epoch": 1.6395864106351552,
"grad_norm": 0.46882204005729433,
"learning_rate": 3.785179017193918e-05,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911528944969177,
"step": 1110,
"valid_targets_mean": 5871.7,
"valid_targets_min": 546
},
{
"epoch": 1.6469719350073855,
"grad_norm": 0.5024285712997323,
"learning_rate": 3.781845813799402e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2931421101093292,
"step": 1115,
"valid_targets_mean": 4670.3,
"valid_targets_min": 451
},
{
"epoch": 1.654357459379616,
"grad_norm": 0.42105185416660457,
"learning_rate": 3.778488440701918e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22011511027812958,
"step": 1120,
"valid_targets_mean": 4687.1,
"valid_targets_min": 298
},
{
"epoch": 1.6617429837518465,
"grad_norm": 0.4534305852538249,
"learning_rate": 3.77510694344228e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18383678793907166,
"step": 1125,
"valid_targets_mean": 5405.8,
"valid_targets_min": 726
},
{
"epoch": 1.6691285081240768,
"grad_norm": 0.3951289835886458,
"learning_rate": 3.771701367888534e-05,
"loss": 0.2383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17336603999137878,
"step": 1130,
"valid_targets_mean": 5009.2,
"valid_targets_min": 395
},
{
"epoch": 1.6765140324963073,
"grad_norm": 0.4886944664495892,
"learning_rate": 3.7682717602353336e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2188146710395813,
"step": 1135,
"valid_targets_mean": 3926.0,
"valid_targets_min": 310
},
{
"epoch": 1.6838995568685378,
"grad_norm": 0.39480650462231015,
"learning_rate": 3.7648181670033125e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20998279750347137,
"step": 1140,
"valid_targets_mean": 6034.9,
"valid_targets_min": 592
},
{
"epoch": 1.691285081240768,
"grad_norm": 0.39214825097931927,
"learning_rate": 3.761340635038456e-05,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1979064792394638,
"step": 1145,
"valid_targets_mean": 7045.8,
"valid_targets_min": 525
},
{
"epoch": 1.6986706056129985,
"grad_norm": 0.38111774464102766,
"learning_rate": 3.7578392115114655e-05,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20325309038162231,
"step": 1150,
"valid_targets_mean": 6202.9,
"valid_targets_min": 630
},
{
"epoch": 1.706056129985229,
"grad_norm": 0.404770101827888,
"learning_rate": 3.754313943917115e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1922975480556488,
"step": 1155,
"valid_targets_mean": 5763.9,
"valid_targets_min": 528
},
{
"epoch": 1.7134416543574593,
"grad_norm": 0.4064959538938459,
"learning_rate": 3.7507648800736116e-05,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2195628136396408,
"step": 1160,
"valid_targets_mean": 5726.2,
"valid_targets_min": 795
},
{
"epoch": 1.7208271787296898,
"grad_norm": 0.5078776991250893,
"learning_rate": 3.747192068121943e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24034610390663147,
"step": 1165,
"valid_targets_mean": 4283.9,
"valid_targets_min": 309
},
{
"epoch": 1.7282127031019203,
"grad_norm": 0.5067333046365079,
"learning_rate": 3.743595556525228e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2246871292591095,
"step": 1170,
"valid_targets_mean": 3702.9,
"valid_targets_min": 529
},
{
"epoch": 1.7355982274741506,
"grad_norm": 0.5019937895256118,
"learning_rate": 3.7399753940680556e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20047210156917572,
"step": 1175,
"valid_targets_mean": 3960.8,
"valid_targets_min": 472
},
{
"epoch": 1.742983751846381,
"grad_norm": 0.41047915116673045,
"learning_rate": 3.736331629855826e-05,
"loss": 0.2262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2049740105867386,
"step": 1180,
"valid_targets_mean": 5736.0,
"valid_targets_min": 815
},
{
"epoch": 1.7503692762186116,
"grad_norm": 0.3945106153005012,
"learning_rate": 3.7326643133140833e-05,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20625770092010498,
"step": 1185,
"valid_targets_mean": 6195.1,
"valid_targets_min": 250
},
{
"epoch": 1.7577548005908419,
"grad_norm": 0.4106742085350737,
"learning_rate": 3.7289734941878455e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24206054210662842,
"step": 1190,
"valid_targets_mean": 6082.2,
"valid_targets_min": 568
},
{
"epoch": 1.7651403249630724,
"grad_norm": 0.5200799032564574,
"learning_rate": 3.7252592225409285e-05,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28392231464385986,
"step": 1195,
"valid_targets_mean": 3605.9,
"valid_targets_min": 523
},
{
"epoch": 1.7725258493353029,
"grad_norm": 0.470687041134897,
"learning_rate": 3.721521548755269e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21265387535095215,
"step": 1200,
"valid_targets_mean": 4151.9,
"valid_targets_min": 541
},
{
"epoch": 1.7799113737075332,
"grad_norm": 0.4428156443932358,
"learning_rate": 3.71776052353024e-05,
"loss": 0.2121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21042832732200623,
"step": 1205,
"valid_targets_mean": 5545.3,
"valid_targets_min": 701
},
{
"epoch": 1.7872968980797637,
"grad_norm": 0.45448533560080073,
"learning_rate": 3.7139761978819625e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27311086654663086,
"step": 1210,
"valid_targets_mean": 5298.8,
"valid_targets_min": 628
},
{
"epoch": 1.7946824224519942,
"grad_norm": 0.4157213284903144,
"learning_rate": 3.7101686231426145e-05,
"loss": 0.2111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21213330328464508,
"step": 1215,
"valid_targets_mean": 5659.4,
"valid_targets_min": 830
},
{
"epoch": 1.8020679468242244,
"grad_norm": 0.3921888627239872,
"learning_rate": 3.706337850959736e-05,
"loss": 0.2073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20621275901794434,
"step": 1220,
"valid_targets_mean": 6066.2,
"valid_targets_min": 679
},
{
"epoch": 1.809453471196455,
"grad_norm": 0.393703088132589,
"learning_rate": 3.702483933295524e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20170754194259644,
"step": 1225,
"valid_targets_mean": 5131.7,
"valid_targets_min": 594
},
{
"epoch": 1.8168389955686854,
"grad_norm": 0.429085603448917,
"learning_rate": 3.698606922426133e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21911361813545227,
"step": 1230,
"valid_targets_mean": 6525.8,
"valid_targets_min": 673
},
{
"epoch": 1.8242245199409157,
"grad_norm": 0.41690498546700655,
"learning_rate": 3.694706870940961e-05,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20087522268295288,
"step": 1235,
"valid_targets_mean": 5197.6,
"valid_targets_min": 656
},
{
"epoch": 1.8316100443131462,
"grad_norm": 0.4214260567191511,
"learning_rate": 3.690783831741942e-05,
"loss": 0.1988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24707287549972534,
"step": 1240,
"valid_targets_mean": 5131.9,
"valid_targets_min": 642
},
{
"epoch": 1.8389955686853767,
"grad_norm": 0.42497684417714315,
"learning_rate": 3.686837858042821e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2418084293603897,
"step": 1245,
"valid_targets_mean": 6411.4,
"valid_targets_min": 726
},
{
"epoch": 1.846381093057607,
"grad_norm": 0.43456506500215386,
"learning_rate": 3.6828690033684394e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23421086370944977,
"step": 1250,
"valid_targets_mean": 4884.8,
"valid_targets_min": 637
},
{
"epoch": 1.8537666174298375,
"grad_norm": 0.3590270619837384,
"learning_rate": 3.678877321554003e-05,
"loss": 0.2317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19189848005771637,
"step": 1255,
"valid_targets_mean": 6340.3,
"valid_targets_min": 588
},
{
"epoch": 1.861152141802068,
"grad_norm": 0.4491792252049705,
"learning_rate": 3.674862866744358e-05,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23957936465740204,
"step": 1260,
"valid_targets_mean": 4542.8,
"valid_targets_min": 638
},
{
"epoch": 1.8685376661742983,
"grad_norm": 0.41595374872963425,
"learning_rate": 3.6708256933932485e-05,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19980810582637787,
"step": 1265,
"valid_targets_mean": 5785.6,
"valid_targets_min": 379
},
{
"epoch": 1.8759231905465288,
"grad_norm": 0.47288076543534235,
"learning_rate": 3.6667658562625867e-05,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2654092311859131,
"step": 1270,
"valid_targets_mean": 5471.1,
"valid_targets_min": 666
},
{
"epoch": 1.8833087149187593,
"grad_norm": 0.38192384234870763,
"learning_rate": 3.662683410421703e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19015946984291077,
"step": 1275,
"valid_targets_mean": 5607.4,
"valid_targets_min": 810
},
{
"epoch": 1.8906942392909896,
"grad_norm": 0.4085790502454245,
"learning_rate": 3.6585784112466034e-05,
"loss": 0.2145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23992851376533508,
"step": 1280,
"valid_targets_mean": 5566.8,
"valid_targets_min": 706
},
{
"epoch": 1.89807976366322,
"grad_norm": 0.3923685608209056,
"learning_rate": 3.6544509144192153e-05,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19036059081554413,
"step": 1285,
"valid_targets_mean": 5585.4,
"valid_targets_min": 766
},
{
"epoch": 1.9054652880354506,
"grad_norm": 0.460825966848905,
"learning_rate": 3.650300975926635e-05,
"loss": 0.2309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20123234391212463,
"step": 1290,
"valid_targets_mean": 4738.8,
"valid_targets_min": 476
},
{
"epoch": 1.9128508124076808,
"grad_norm": 0.46958242857442417,
"learning_rate": 3.646128652060367e-05,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20810635387897491,
"step": 1295,
"valid_targets_mean": 4939.5,
"valid_targets_min": 640
},
{
"epoch": 1.9202363367799113,
"grad_norm": 0.513107015645425,
"learning_rate": 3.6419339994155596e-05,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23249667882919312,
"step": 1300,
"valid_targets_mean": 3900.5,
"valid_targets_min": 512
},
{
"epoch": 1.9276218611521418,
"grad_norm": 0.41491988804017377,
"learning_rate": 3.637717074890238e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20350153744220734,
"step": 1305,
"valid_targets_mean": 5207.5,
"valid_targets_min": 687
},
{
"epoch": 1.9350073855243721,
"grad_norm": 0.3852016695481521,
"learning_rate": 3.633477935684532e-05,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16912466287612915,
"step": 1310,
"valid_targets_mean": 5948.2,
"valid_targets_min": 558
},
{
"epoch": 1.9423929098966026,
"grad_norm": 0.47994385762704583,
"learning_rate": 3.629216639299903e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2138756513595581,
"step": 1315,
"valid_targets_mean": 4660.0,
"valid_targets_min": 546
},
{
"epoch": 1.9497784342688331,
"grad_norm": 0.43044739199814863,
"learning_rate": 3.624933243538359e-05,
"loss": 0.2237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20759987831115723,
"step": 1320,
"valid_targets_mean": 4612.2,
"valid_targets_min": 586
},
{
"epoch": 1.9571639586410634,
"grad_norm": 0.44206360398309225,
"learning_rate": 3.6206278065016744e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20062926411628723,
"step": 1325,
"valid_targets_mean": 4257.2,
"valid_targets_min": 474
},
{
"epoch": 1.964549483013294,
"grad_norm": 0.832328393558017,
"learning_rate": 3.616300386590601e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2263094186782837,
"step": 1330,
"valid_targets_mean": 3523.4,
"valid_targets_min": 320
},
{
"epoch": 1.9719350073855244,
"grad_norm": 0.5608605363552897,
"learning_rate": 3.6119510425040746e-05,
"loss": 0.2153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2241973727941513,
"step": 1335,
"valid_targets_mean": 3184.9,
"valid_targets_min": 400
},
{
"epoch": 1.9793205317577547,
"grad_norm": 0.42827418469595757,
"learning_rate": 3.6075798332384205e-05,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21591341495513916,
"step": 1340,
"valid_targets_mean": 5014.1,
"valid_targets_min": 703
},
{
"epoch": 1.9867060561299852,
"grad_norm": 0.4376829994779159,
"learning_rate": 3.603186818086552e-05,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24252906441688538,
"step": 1345,
"valid_targets_mean": 5612.9,
"valid_targets_min": 843
},
{
"epoch": 1.9940915805022157,
"grad_norm": 0.48296281574524147,
"learning_rate": 3.598772056637166e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911834716796875,
"step": 1350,
"valid_targets_mean": 5862.9,
"valid_targets_min": 542
},
{
"epoch": 2.001477104874446,
"grad_norm": 0.4285021994401378,
"learning_rate": 3.594335608773937e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17348650097846985,
"step": 1355,
"valid_targets_mean": 5699.8,
"valid_targets_min": 622
},
{
"epoch": 2.0088626292466767,
"grad_norm": 0.5571499078773812,
"learning_rate": 3.589877534674702e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21984922885894775,
"step": 1360,
"valid_targets_mean": 4844.9,
"valid_targets_min": 310
},
{
"epoch": 2.016248153618907,
"grad_norm": 0.4762775499228357,
"learning_rate": 3.585397894810645e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2565491497516632,
"step": 1365,
"valid_targets_mean": 5172.8,
"valid_targets_min": 531
},
{
"epoch": 2.0236336779911372,
"grad_norm": 0.4890064307141238,
"learning_rate": 3.580896749945478e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.198519766330719,
"step": 1370,
"valid_targets_mean": 5031.6,
"valid_targets_min": 709
},
{
"epoch": 2.031019202363368,
"grad_norm": 0.42188127103720335,
"learning_rate": 3.576374161134614e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17222025990486145,
"step": 1375,
"valid_targets_mean": 5100.7,
"valid_targets_min": 506
},
{
"epoch": 2.0384047267355982,
"grad_norm": 0.4032153526008752,
"learning_rate": 3.571830189724344e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22092564404010773,
"step": 1380,
"valid_targets_mean": 6401.4,
"valid_targets_min": 733
},
{
"epoch": 2.0457902511078285,
"grad_norm": 0.4090149314677475,
"learning_rate": 3.5672648973509975e-05,
"loss": 0.2037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19857646524906158,
"step": 1385,
"valid_targets_mean": 5839.8,
"valid_targets_min": 589
},
{
"epoch": 2.0531757754800593,
"grad_norm": 0.4666629189772267,
"learning_rate": 3.5626783459401136e-05,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22908130288124084,
"step": 1390,
"valid_targets_mean": 4732.4,
"valid_targets_min": 481
},
{
"epoch": 2.0605612998522895,
"grad_norm": 0.5167728208836535,
"learning_rate": 3.558070597705597e-05,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30561476945877075,
"step": 1395,
"valid_targets_mean": 5980.4,
"valid_targets_min": 499
},
{
"epoch": 2.06794682422452,
"grad_norm": 0.4957521107813994,
"learning_rate": 3.553441715148874e-05,
"loss": 0.2013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24766743183135986,
"step": 1400,
"valid_targets_mean": 5423.2,
"valid_targets_min": 636
},
{
"epoch": 2.0753323485967505,
"grad_norm": 0.5065232042372999,
"learning_rate": 3.5487917610580464e-05,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19253401458263397,
"step": 1405,
"valid_targets_mean": 4459.0,
"valid_targets_min": 731
},
{
"epoch": 2.082717872968981,
"grad_norm": 0.4366761703530371,
"learning_rate": 3.5441207985070405e-05,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20609664916992188,
"step": 1410,
"valid_targets_mean": 5449.8,
"valid_targets_min": 973
},
{
"epoch": 2.090103397341211,
"grad_norm": 0.3956592099323369,
"learning_rate": 3.5394288908547476e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1563621610403061,
"step": 1415,
"valid_targets_mean": 5519.1,
"valid_targets_min": 520
},
{
"epoch": 2.097488921713442,
"grad_norm": 0.5353026127089262,
"learning_rate": 3.534716101744168e-05,
"loss": 0.1847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1830843836069107,
"step": 1420,
"valid_targets_mean": 3676.1,
"valid_targets_min": 541
},
{
"epoch": 2.104874446085672,
"grad_norm": 0.4240842603893816,
"learning_rate": 3.529982495101549e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1899888962507248,
"step": 1425,
"valid_targets_mean": 5484.6,
"valid_targets_min": 573
},
{
"epoch": 2.1122599704579024,
"grad_norm": 0.4026373876082126,
"learning_rate": 3.5252281351355124e-05,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18199166655540466,
"step": 1430,
"valid_targets_mean": 5762.3,
"valid_targets_min": 564
},
{
"epoch": 2.119645494830133,
"grad_norm": 0.40632759254314066,
"learning_rate": 3.520453086336188e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1754504293203354,
"step": 1435,
"valid_targets_mean": 5398.9,
"valid_targets_min": 642
},
{
"epoch": 2.1270310192023634,
"grad_norm": 0.35808057513210484,
"learning_rate": 3.515657413474339e-05,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13614241778850555,
"step": 1440,
"valid_targets_mean": 6742.3,
"valid_targets_min": 736
},
{
"epoch": 2.1344165435745936,
"grad_norm": 0.4139451850923316,
"learning_rate": 3.5108411816004796e-05,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15198799967765808,
"step": 1445,
"valid_targets_mean": 4605.1,
"valid_targets_min": 696
},
{
"epoch": 2.1418020679468244,
"grad_norm": 0.4487084052336881,
"learning_rate": 3.506004456043997e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18390825390815735,
"step": 1450,
"valid_targets_mean": 4883.0,
"valid_targets_min": 631
},
{
"epoch": 2.1491875923190547,
"grad_norm": 0.4525728518238653,
"learning_rate": 3.501147302412263e-05,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22244812548160553,
"step": 1455,
"valid_targets_mean": 4889.0,
"valid_targets_min": 640
},
{
"epoch": 2.156573116691285,
"grad_norm": 0.4649134318287312,
"learning_rate": 3.496269786589743e-05,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19458895921707153,
"step": 1460,
"valid_targets_mean": 5381.3,
"valid_targets_min": 727
},
{
"epoch": 2.1639586410635157,
"grad_norm": 0.3972438491459193,
"learning_rate": 3.491371974737105e-05,
"loss": 0.2172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19966194033622742,
"step": 1465,
"valid_targets_mean": 6120.7,
"valid_targets_min": 289
},
{
"epoch": 2.171344165435746,
"grad_norm": 0.4119929448789575,
"learning_rate": 3.486453933290321e-05,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2048000693321228,
"step": 1470,
"valid_targets_mean": 5923.5,
"valid_targets_min": 695
},
{
"epoch": 2.178729689807976,
"grad_norm": 0.43265541786608985,
"learning_rate": 3.481515728959764e-05,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19329239428043365,
"step": 1475,
"valid_targets_mean": 5209.0,
"valid_targets_min": 559
},
{
"epoch": 2.186115214180207,
"grad_norm": 0.726326713865377,
"learning_rate": 3.4765574287293064e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22369539737701416,
"step": 1480,
"valid_targets_mean": 3706.1,
"valid_targets_min": 348
},
{
"epoch": 2.193500738552437,
"grad_norm": 0.4285241209732484,
"learning_rate": 3.47157909985541e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1844395101070404,
"step": 1485,
"valid_targets_mean": 5193.9,
"valid_targets_min": 655
},
{
"epoch": 2.2008862629246675,
"grad_norm": 0.3568827709297404,
"learning_rate": 3.466580809866213e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16118377447128296,
"step": 1490,
"valid_targets_mean": 5637.3,
"valid_targets_min": 616
},
{
"epoch": 2.208271787296898,
"grad_norm": 0.40674844742126304,
"learning_rate": 3.461562626560613e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1650213599205017,
"step": 1495,
"valid_targets_mean": 5220.6,
"valid_targets_min": 578
},
{
"epoch": 2.2156573116691285,
"grad_norm": 0.40044238504347957,
"learning_rate": 3.456524618007352e-05,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18922209739685059,
"step": 1500,
"valid_targets_mean": 5842.4,
"valid_targets_min": 680
},
{
"epoch": 2.2230428360413588,
"grad_norm": 0.46819866949961275,
"learning_rate": 3.451466852544087e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22434237599372864,
"step": 1505,
"valid_targets_mean": 4454.3,
"valid_targets_min": 585
},
{
"epoch": 2.2304283604135895,
"grad_norm": 0.358887635540945,
"learning_rate": 3.446389398776468e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16988348960876465,
"step": 1510,
"valid_targets_mean": 6279.1,
"valid_targets_min": 710
},
{
"epoch": 2.2378138847858198,
"grad_norm": 0.40829806216099035,
"learning_rate": 3.441292325577204e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1971379816532135,
"step": 1515,
"valid_targets_mean": 6296.1,
"valid_targets_min": 822
},
{
"epoch": 2.24519940915805,
"grad_norm": 0.40160684926373197,
"learning_rate": 3.436175702085132e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17605721950531006,
"step": 1520,
"valid_targets_mean": 5582.8,
"valid_targets_min": 486
},
{
"epoch": 2.2525849335302808,
"grad_norm": 0.5229993777219565,
"learning_rate": 3.431039597704275e-05,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23692980408668518,
"step": 1525,
"valid_targets_mean": 4018.5,
"valid_targets_min": 479
},
{
"epoch": 2.259970457902511,
"grad_norm": 0.6849225115875504,
"learning_rate": 3.425884082102904e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28416967391967773,
"step": 1530,
"valid_targets_mean": 2544.4,
"valid_targets_min": 400
},
{
"epoch": 2.2673559822747413,
"grad_norm": 0.4227339555943465,
"learning_rate": 3.4207092252125934e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20092085003852844,
"step": 1535,
"valid_targets_mean": 5492.9,
"valid_targets_min": 654
},
{
"epoch": 2.274741506646972,
"grad_norm": 0.4345429425277249,
"learning_rate": 3.415515097227269e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21635641157627106,
"step": 1540,
"valid_targets_mean": 5030.1,
"valid_targets_min": 489
},
{
"epoch": 2.2821270310192023,
"grad_norm": 0.4693229139379586,
"learning_rate": 3.4103017686022584e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2364303320646286,
"step": 1545,
"valid_targets_mean": 4731.6,
"valid_targets_min": 562
},
{
"epoch": 2.2895125553914326,
"grad_norm": 0.38590061526432556,
"learning_rate": 3.4050693100533334e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16934344172477722,
"step": 1550,
"valid_targets_mean": 6597.2,
"valid_targets_min": 590
},
{
"epoch": 2.2968980797636633,
"grad_norm": 0.3661821378036947,
"learning_rate": 3.399817792555756e-05,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15037478506565094,
"step": 1555,
"valid_targets_mean": 5859.4,
"valid_targets_min": 620
},
{
"epoch": 2.3042836041358936,
"grad_norm": 0.5749118981748869,
"learning_rate": 3.394547287343307e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21516035497188568,
"step": 1560,
"valid_targets_mean": 3785.1,
"valid_targets_min": 308
},
{
"epoch": 2.311669128508124,
"grad_norm": 0.5222981613404089,
"learning_rate": 3.389257865907329e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672545909881592,
"step": 1565,
"valid_targets_mean": 4263.8,
"valid_targets_min": 562
},
{
"epoch": 2.3190546528803546,
"grad_norm": 0.39866742666796046,
"learning_rate": 3.383949599995747e-05,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20826904475688934,
"step": 1570,
"valid_targets_mean": 6104.1,
"valid_targets_min": 490
},
{
"epoch": 2.326440177252585,
"grad_norm": 0.5020262347414661,
"learning_rate": 3.378622561612105e-05,
"loss": 0.2017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17644500732421875,
"step": 1575,
"valid_targets_mean": 4395.3,
"valid_targets_min": 535
},
{
"epoch": 2.333825701624815,
"grad_norm": 0.48126474522159196,
"learning_rate": 3.3732768230145834e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2069077491760254,
"step": 1580,
"valid_targets_mean": 4419.8,
"valid_targets_min": 617
},
{
"epoch": 2.341211225997046,
"grad_norm": 0.35388137699572986,
"learning_rate": 3.3679124567150195e-05,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15227368474006653,
"step": 1585,
"valid_targets_mean": 6494.9,
"valid_targets_min": 682
},
{
"epoch": 2.348596750369276,
"grad_norm": 0.3840750165781411,
"learning_rate": 3.362529535477923e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.170127272605896,
"step": 1590,
"valid_targets_mean": 6790.0,
"valid_targets_min": 1006
},
{
"epoch": 2.3559822747415065,
"grad_norm": 0.5434507333346537,
"learning_rate": 3.357128132319494e-05,
"loss": 0.2114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20456504821777344,
"step": 1595,
"valid_targets_mean": 3017.6,
"valid_targets_min": 320
},
{
"epoch": 2.363367799113737,
"grad_norm": 0.4069694394082241,
"learning_rate": 3.3517083205066275e-05,
"loss": 0.2013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19211331009864807,
"step": 1600,
"valid_targets_mean": 5513.6,
"valid_targets_min": 681
},
{
"epoch": 2.3707533234859675,
"grad_norm": 0.41784163330661017,
"learning_rate": 3.34627017355592e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18239319324493408,
"step": 1605,
"valid_targets_mean": 4941.2,
"valid_targets_min": 540
},
{
"epoch": 2.3781388478581977,
"grad_norm": 0.39238043020867075,
"learning_rate": 3.340813765232675e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1841011941432953,
"step": 1610,
"valid_targets_mean": 5700.5,
"valid_targets_min": 517
},
{
"epoch": 2.3855243722304285,
"grad_norm": 0.4201145604723071,
"learning_rate": 3.3353391695499e-05,
"loss": 0.2,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20100927352905273,
"step": 1615,
"valid_targets_mean": 5057.5,
"valid_targets_min": 491
},
{
"epoch": 2.3929098966026587,
"grad_norm": 0.41846525077178565,
"learning_rate": 3.329846460767305e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20187963545322418,
"step": 1620,
"valid_targets_mean": 4845.5,
"valid_targets_min": 523
},
{
"epoch": 2.4002954209748895,
"grad_norm": 0.40798367807953856,
"learning_rate": 3.324335713390292e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15751047432422638,
"step": 1625,
"valid_targets_mean": 5196.8,
"valid_targets_min": 314
},
{
"epoch": 2.4076809453471197,
"grad_norm": 0.4061768747540575,
"learning_rate": 3.3188070021689464e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17988130450248718,
"step": 1630,
"valid_targets_mean": 5505.8,
"valid_targets_min": 605
},
{
"epoch": 2.41506646971935,
"grad_norm": 0.46242647917420265,
"learning_rate": 3.313260402097024e-05,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2638862729072571,
"step": 1635,
"valid_targets_mean": 5006.3,
"valid_targets_min": 510
},
{
"epoch": 2.4224519940915803,
"grad_norm": 0.49810161190363844,
"learning_rate": 3.307695988410931e-05,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2404661476612091,
"step": 1640,
"valid_targets_mean": 5057.5,
"valid_targets_min": 870
},
{
"epoch": 2.429837518463811,
"grad_norm": 0.49091951535741857,
"learning_rate": 3.302113836588705e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21287889778614044,
"step": 1645,
"valid_targets_mean": 3981.2,
"valid_targets_min": 336
},
{
"epoch": 2.4372230428360413,
"grad_norm": 0.570596929329595,
"learning_rate": 3.296514022348991e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22047343850135803,
"step": 1650,
"valid_targets_mean": 5769.9,
"valid_targets_min": 747
},
{
"epoch": 2.444608567208272,
"grad_norm": 0.45209355569835663,
"learning_rate": 3.2908966216500164e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17555588483810425,
"step": 1655,
"valid_targets_mean": 5262.3,
"valid_targets_min": 642
},
{
"epoch": 2.4519940915805023,
"grad_norm": 0.5750894848392384,
"learning_rate": 3.2852617106885554e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24034175276756287,
"step": 1660,
"valid_targets_mean": 2897.2,
"valid_targets_min": 553
},
{
"epoch": 2.4593796159527326,
"grad_norm": 0.44533416665746417,
"learning_rate": 3.279609365898903e-05,
"loss": 0.1968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18521445989608765,
"step": 1665,
"valid_targets_mean": 4074.0,
"valid_targets_min": 559
},
{
"epoch": 2.466765140324963,
"grad_norm": 0.3666396515845462,
"learning_rate": 3.273939663951828e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1782068908214569,
"step": 1670,
"valid_targets_mean": 6837.4,
"valid_targets_min": 600
},
{
"epoch": 2.4741506646971936,
"grad_norm": 0.3899278710986994,
"learning_rate": 3.268252681753546e-05,
"loss": 0.2211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2376466989517212,
"step": 1675,
"valid_targets_mean": 6254.3,
"valid_targets_min": 784
},
{
"epoch": 2.481536189069424,
"grad_norm": 0.4081436844860877,
"learning_rate": 3.262548496444664e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19119364023208618,
"step": 1680,
"valid_targets_mean": 5165.9,
"valid_targets_min": 669
},
{
"epoch": 2.4889217134416546,
"grad_norm": 0.3782408782114525,
"learning_rate": 3.25682718539914e-05,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1731245368719101,
"step": 1685,
"valid_targets_mean": 6192.8,
"valid_targets_min": 844
},
{
"epoch": 2.496307237813885,
"grad_norm": 0.5214383122274813,
"learning_rate": 3.251088826223235e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2473294734954834,
"step": 1690,
"valid_targets_mean": 3865.7,
"valid_targets_min": 553
},
{
"epoch": 2.503692762186115,
"grad_norm": 0.48463478522919884,
"learning_rate": 3.245333496754455e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2620091736316681,
"step": 1695,
"valid_targets_mean": 4272.6,
"valid_targets_min": 713
},
{
"epoch": 2.5110782865583454,
"grad_norm": 0.48594394962497084,
"learning_rate": 3.239561275060501e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23510144650936127,
"step": 1700,
"valid_targets_mean": 4500.4,
"valid_targets_min": 516
},
{
"epoch": 2.518463810930576,
"grad_norm": 0.36026021621317095,
"learning_rate": 3.233772239438206e-05,
"loss": 0.198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24801120162010193,
"step": 1705,
"valid_targets_mean": 7072.2,
"valid_targets_min": 775
},
{
"epoch": 2.5258493353028064,
"grad_norm": 0.5691361574973622,
"learning_rate": 3.2279664684124724e-05,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24925799667835236,
"step": 1710,
"valid_targets_mean": 4504.7,
"valid_targets_min": 377
},
{
"epoch": 2.533234859675037,
"grad_norm": 0.399794469998823,
"learning_rate": 3.22214404073521e-05,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16049984097480774,
"step": 1715,
"valid_targets_mean": 6125.9,
"valid_targets_min": 497
},
{
"epoch": 2.5406203840472674,
"grad_norm": 0.41442596267228626,
"learning_rate": 3.216305035384268e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17098268866539001,
"step": 1720,
"valid_targets_mean": 5603.4,
"valid_targets_min": 686
},
{
"epoch": 2.5480059084194977,
"grad_norm": 0.4162604595759132,
"learning_rate": 3.210449531562361e-05,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16771002113819122,
"step": 1725,
"valid_targets_mean": 4639.4,
"valid_targets_min": 552
},
{
"epoch": 2.555391432791728,
"grad_norm": 0.38874831725964026,
"learning_rate": 3.2045776086959945e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17640861868858337,
"step": 1730,
"valid_targets_mean": 5082.9,
"valid_targets_min": 125
},
{
"epoch": 2.5627769571639587,
"grad_norm": 0.36315151583426797,
"learning_rate": 3.1986893464343913e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1778927743434906,
"step": 1735,
"valid_targets_mean": 5937.7,
"valid_targets_min": 826
},
{
"epoch": 2.570162481536189,
"grad_norm": 0.44124180419701514,
"learning_rate": 3.192784824648405e-05,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22931697964668274,
"step": 1740,
"valid_targets_mean": 4890.1,
"valid_targets_min": 436
},
{
"epoch": 2.5775480059084197,
"grad_norm": 0.4646453073195735,
"learning_rate": 3.186864123429443e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1924285590648651,
"step": 1745,
"valid_targets_mean": 4559.1,
"valid_targets_min": 626
},
{
"epoch": 2.58493353028065,
"grad_norm": 0.3769877916171565,
"learning_rate": 3.180927323088377e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19486212730407715,
"step": 1750,
"valid_targets_mean": 7005.6,
"valid_targets_min": 873
},
{
"epoch": 2.5923190546528803,
"grad_norm": 0.4122861646475437,
"learning_rate": 3.1749745041544535e-05,
"loss": 0.202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1655203104019165,
"step": 1755,
"valid_targets_mean": 5165.2,
"valid_targets_min": 362
},
{
"epoch": 2.5997045790251105,
"grad_norm": 0.46795037129236655,
"learning_rate": 3.169005747374202e-05,
"loss": 0.2191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.210823655128479,
"step": 1760,
"valid_targets_mean": 4634.7,
"valid_targets_min": 557
},
{
"epoch": 2.6070901033973413,
"grad_norm": 0.40305455364946613,
"learning_rate": 3.163021133710339e-05,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19001798331737518,
"step": 1765,
"valid_targets_mean": 6316.5,
"valid_targets_min": 515
},
{
"epoch": 2.6144756277695715,
"grad_norm": 0.37687379981581354,
"learning_rate": 3.1570207443406715e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.156022310256958,
"step": 1770,
"valid_targets_mean": 5602.8,
"valid_targets_min": 636
},
{
"epoch": 2.6218611521418023,
"grad_norm": 0.41470758369539723,
"learning_rate": 3.1510046606569944e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1826784908771515,
"step": 1775,
"valid_targets_mean": 5436.1,
"valid_targets_min": 541
},
{
"epoch": 2.6292466765140325,
"grad_norm": 0.3852868541588975,
"learning_rate": 3.1449729642639856e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17214235663414001,
"step": 1780,
"valid_targets_mean": 5589.0,
"valid_targets_min": 475
},
{
"epoch": 2.636632200886263,
"grad_norm": 0.4088176838039698,
"learning_rate": 3.138925736978103e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18025021255016327,
"step": 1785,
"valid_targets_mean": 4904.5,
"valid_targets_min": 833
},
{
"epoch": 2.644017725258493,
"grad_norm": 0.4491076662753666,
"learning_rate": 3.132863060826469e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18313133716583252,
"step": 1790,
"valid_targets_mean": 4372.4,
"valid_targets_min": 504
},
{
"epoch": 2.651403249630724,
"grad_norm": 0.4132101343175699,
"learning_rate": 3.126785018045764e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18020716309547424,
"step": 1795,
"valid_targets_mean": 5285.4,
"valid_targets_min": 324
},
{
"epoch": 2.658788774002954,
"grad_norm": 0.6224525946031296,
"learning_rate": 3.120691691081104e-05,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18289199471473694,
"step": 1800,
"valid_targets_mean": 5814.2,
"valid_targets_min": 712
},
{
"epoch": 2.666174298375185,
"grad_norm": 0.37344081795259465,
"learning_rate": 3.1145831625849315e-05,
"loss": 0.2139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18605783581733704,
"step": 1805,
"valid_targets_mean": 6338.0,
"valid_targets_min": 708
},
{
"epoch": 2.673559822747415,
"grad_norm": 0.45469603573341405,
"learning_rate": 3.1084595154158814e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20985165238380432,
"step": 1810,
"valid_targets_mean": 4686.1,
"valid_targets_min": 694
},
{
"epoch": 2.6809453471196454,
"grad_norm": 0.42143425429690434,
"learning_rate": 3.1023208326376716e-05,
"loss": 0.2089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1601705253124237,
"step": 1815,
"valid_targets_mean": 5887.0,
"valid_targets_min": 629
},
{
"epoch": 2.6883308714918757,
"grad_norm": 0.4566218104083272,
"learning_rate": 3.0961671975179674e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22524869441986084,
"step": 1820,
"valid_targets_mean": 5187.4,
"valid_targets_min": 425
},
{
"epoch": 2.6957163958641064,
"grad_norm": 0.45904018086003157,
"learning_rate": 3.08999869352725e-05,
"loss": 0.1894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2111627757549286,
"step": 1825,
"valid_targets_mean": 4385.9,
"valid_targets_min": 476
},
{
"epoch": 2.7031019202363367,
"grad_norm": 0.3947587132525764,
"learning_rate": 3.0838154043376936e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1816597878932953,
"step": 1830,
"valid_targets_mean": 5509.4,
"valid_targets_min": 311
},
{
"epoch": 2.7104874446085674,
"grad_norm": 0.44429247184816495,
"learning_rate": 3.077617413822022e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16769450902938843,
"step": 1835,
"valid_targets_mean": 5723.1,
"valid_targets_min": 650
},
{
"epoch": 2.7178729689807977,
"grad_norm": 0.39766345484896237,
"learning_rate": 3.0714048060523745e-05,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.183930903673172,
"step": 1840,
"valid_targets_mean": 5270.6,
"valid_targets_min": 926
},
{
"epoch": 2.725258493353028,
"grad_norm": 0.36819777572651946,
"learning_rate": 3.065177665299166e-05,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18269002437591553,
"step": 1845,
"valid_targets_mean": 6104.4,
"valid_targets_min": 573
},
{
"epoch": 2.7326440177252582,
"grad_norm": 0.656642708317576,
"learning_rate": 3.0589360760299416e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2284368872642517,
"step": 1850,
"valid_targets_mean": 4357.9,
"valid_targets_min": 457
},
{
"epoch": 2.740029542097489,
"grad_norm": 0.40389665086925014,
"learning_rate": 3.052680122908232e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1856120228767395,
"step": 1855,
"valid_targets_mean": 4957.6,
"valid_targets_min": 529
},
{
"epoch": 2.7474150664697192,
"grad_norm": 0.34197083654429966,
"learning_rate": 3.046409890792406e-05,
"loss": 0.2,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15076898038387299,
"step": 1860,
"valid_targets_mean": 5943.9,
"valid_targets_min": 490
},
{
"epoch": 2.75480059084195,
"grad_norm": 0.39694434070650186,
"learning_rate": 3.040125464734519e-05,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22727245092391968,
"step": 1865,
"valid_targets_mean": 6380.9,
"valid_targets_min": 611
},
{
"epoch": 2.7621861152141802,
"grad_norm": 0.48955312172318344,
"learning_rate": 3.0338269299791573e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18965637683868408,
"step": 1870,
"valid_targets_mean": 4740.5,
"valid_targets_min": 595
},
{
"epoch": 2.7695716395864105,
"grad_norm": 0.498553979771601,
"learning_rate": 3.0275143719622853e-05,
"loss": 0.196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18993785977363586,
"step": 1875,
"valid_targets_mean": 6250.0,
"valid_targets_min": 790
},
{
"epoch": 2.7769571639586412,
"grad_norm": 0.4680949760689842,
"learning_rate": 3.0211878763100836e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19833850860595703,
"step": 1880,
"valid_targets_mean": 4042.8,
"valid_targets_min": 639
},
{
"epoch": 2.7843426883308715,
"grad_norm": 0.6983614556096809,
"learning_rate": 3.0148475288377896e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18655887246131897,
"step": 1885,
"valid_targets_mean": 5421.7,
"valid_targets_min": 761
},
{
"epoch": 2.791728212703102,
"grad_norm": 0.3993729610123753,
"learning_rate": 3.0084934155485315e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17627528309822083,
"step": 1890,
"valid_targets_mean": 5305.3,
"valid_targets_min": 598
},
{
"epoch": 2.7991137370753325,
"grad_norm": 0.3486684335819875,
"learning_rate": 3.0021256226321643e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17181184887886047,
"step": 1895,
"valid_targets_mean": 6981.1,
"valid_targets_min": 461
},
{
"epoch": 2.806499261447563,
"grad_norm": 0.3996801724597566,
"learning_rate": 2.995744236464098e-05,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19423222541809082,
"step": 1900,
"valid_targets_mean": 5607.2,
"valid_targets_min": 658
},
{
"epoch": 2.813884785819793,
"grad_norm": 0.4684471879315951,
"learning_rate": 2.9893493436041274e-05,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2360610067844391,
"step": 1905,
"valid_targets_mean": 4200.7,
"valid_targets_min": 726
},
{
"epoch": 2.821270310192024,
"grad_norm": 0.5224516946852575,
"learning_rate": 2.9829410307952577e-05,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18097460269927979,
"step": 1910,
"valid_targets_mean": 5226.1,
"valid_targets_min": 453
},
{
"epoch": 2.828655834564254,
"grad_norm": 0.3919890597149292,
"learning_rate": 2.9765193849625283e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16534635424613953,
"step": 1915,
"valid_targets_mean": 5494.3,
"valid_targets_min": 459
},
{
"epoch": 2.8360413589364843,
"grad_norm": 0.3195931232516741,
"learning_rate": 2.9700844932118334e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442551165819168,
"step": 1920,
"valid_targets_mean": 6732.5,
"valid_targets_min": 614
},
{
"epoch": 2.843426883308715,
"grad_norm": 0.42131927060359514,
"learning_rate": 2.9636364428287395e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19797298312187195,
"step": 1925,
"valid_targets_mean": 4944.9,
"valid_targets_min": 456
},
{
"epoch": 2.8508124076809453,
"grad_norm": 0.3873317542623266,
"learning_rate": 2.9571753212773028e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17931729555130005,
"step": 1930,
"valid_targets_mean": 5626.6,
"valid_targets_min": 496
},
{
"epoch": 2.8581979320531756,
"grad_norm": 0.4030896596505125,
"learning_rate": 2.9507012161988827e-05,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17033201456069946,
"step": 1935,
"valid_targets_mean": 6326.3,
"valid_targets_min": 768
},
{
"epoch": 2.8655834564254064,
"grad_norm": 0.4444109946556492,
"learning_rate": 2.9442142154109522e-05,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1885213851928711,
"step": 1940,
"valid_targets_mean": 5517.4,
"valid_targets_min": 802
},
{
"epoch": 2.8729689807976366,
"grad_norm": 0.46145234382410805,
"learning_rate": 2.937714406905906e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20272204279899597,
"step": 1945,
"valid_targets_mean": 5488.1,
"valid_targets_min": 656
},
{
"epoch": 2.880354505169867,
"grad_norm": 0.42923087358401046,
"learning_rate": 2.9312018788498714e-05,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19835910201072693,
"step": 1950,
"valid_targets_mean": 4609.9,
"valid_targets_min": 246
},
{
"epoch": 2.8877400295420976,
"grad_norm": 0.36880559499022475,
"learning_rate": 2.924676719581506e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19959020614624023,
"step": 1955,
"valid_targets_mean": 7206.6,
"valid_targets_min": 337
},
{
"epoch": 2.895125553914328,
"grad_norm": 0.3694784724494498,
"learning_rate": 2.9181390176108024e-05,
"loss": 0.1957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16610810160636902,
"step": 1960,
"valid_targets_mean": 5820.9,
"valid_targets_min": 743
},
{
"epoch": 2.902511078286558,
"grad_norm": 0.3748352447951345,
"learning_rate": 2.911588861617889e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1821543574333191,
"step": 1965,
"valid_targets_mean": 6034.1,
"valid_targets_min": 257
},
{
"epoch": 2.909896602658789,
"grad_norm": 0.46557987222831126,
"learning_rate": 2.9050263404518254e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2896730303764343,
"step": 1970,
"valid_targets_mean": 5670.9,
"valid_targets_min": 664
},
{
"epoch": 2.917282127031019,
"grad_norm": 0.45582660198656316,
"learning_rate": 2.8984515431293982e-05,
"loss": 0.2213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21186470985412598,
"step": 1975,
"valid_targets_mean": 5415.5,
"valid_targets_min": 511
},
{
"epoch": 2.9246676514032495,
"grad_norm": 0.39058091819087787,
"learning_rate": 2.89186455883391e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18955285847187042,
"step": 1980,
"valid_targets_mean": 5434.4,
"valid_targets_min": 675
},
{
"epoch": 2.93205317577548,
"grad_norm": 0.38016760545252115,
"learning_rate": 2.8852654769139774e-05,
"loss": 0.2191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.243728905916214,
"step": 1985,
"valid_targets_mean": 6925.2,
"valid_targets_min": 673
},
{
"epoch": 2.9394387001477105,
"grad_norm": 0.546712089772061,
"learning_rate": 2.8786543868823104e-05,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17349129915237427,
"step": 1990,
"valid_targets_mean": 4468.9,
"valid_targets_min": 543
},
{
"epoch": 2.9468242245199407,
"grad_norm": 0.4515115845526151,
"learning_rate": 2.8720313784145036e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20189234614372253,
"step": 1995,
"valid_targets_mean": 4474.2,
"valid_targets_min": 495
},
{
"epoch": 2.9542097488921715,
"grad_norm": 0.3831876618295643,
"learning_rate": 2.865396541347818e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15678755939006805,
"step": 2000,
"valid_targets_mean": 4760.3,
"valid_targets_min": 370
},
{
"epoch": 2.9615952732644018,
"grad_norm": 0.40740457187470347,
"learning_rate": 2.8587499656799624e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17568612098693848,
"step": 2005,
"valid_targets_mean": 4997.9,
"valid_targets_min": 742
},
{
"epoch": 2.9689807976366325,
"grad_norm": 0.3735878296428736,
"learning_rate": 2.852091741567874e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21047380566596985,
"step": 2010,
"valid_targets_mean": 6746.7,
"valid_targets_min": 587
},
{
"epoch": 2.9763663220088628,
"grad_norm": 0.4064437208033243,
"learning_rate": 2.8454219593264924e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.168643057346344,
"step": 2015,
"valid_targets_mean": 5444.5,
"valid_targets_min": 282
},
{
"epoch": 2.983751846381093,
"grad_norm": 0.4221057265749455,
"learning_rate": 2.8387407094275378e-05,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20394739508628845,
"step": 2020,
"valid_targets_mean": 5266.9,
"valid_targets_min": 790
},
{
"epoch": 2.9911373707533233,
"grad_norm": 0.35734323137197604,
"learning_rate": 2.8320480824982836e-05,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15881027281284332,
"step": 2025,
"valid_targets_mean": 5607.5,
"valid_targets_min": 572
},
{
"epoch": 2.998522895125554,
"grad_norm": 0.40362443061193043,
"learning_rate": 2.825344169320323e-05,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19752827286720276,
"step": 2030,
"valid_targets_mean": 5551.8,
"valid_targets_min": 636
},
{
"epoch": 3.0059084194977843,
"grad_norm": 0.3483325395168603,
"learning_rate": 2.818629060828344e-05,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15444116294384003,
"step": 2035,
"valid_targets_mean": 6590.1,
"valid_targets_min": 2768
},
{
"epoch": 3.0132939438700146,
"grad_norm": 0.46266772441200416,
"learning_rate": 2.811902848108889e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18906280398368835,
"step": 2040,
"valid_targets_mean": 4889.4,
"valid_targets_min": 873
},
{
"epoch": 3.0206794682422453,
"grad_norm": 0.41227568999635833,
"learning_rate": 2.8051656223991274e-05,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16269494593143463,
"step": 2045,
"valid_targets_mean": 5567.1,
"valid_targets_min": 616
},
{
"epoch": 3.0280649926144756,
"grad_norm": 0.46419141803047215,
"learning_rate": 2.798417475085608e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1930653154850006,
"step": 2050,
"valid_targets_mean": 5456.0,
"valid_targets_min": 708
},
{
"epoch": 3.035450516986706,
"grad_norm": 0.4383446251656798,
"learning_rate": 2.791658497703029e-05,
"loss": 0.1809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18855616450309753,
"step": 2055,
"valid_targets_mean": 5512.9,
"valid_targets_min": 571
},
{
"epoch": 3.0428360413589366,
"grad_norm": 0.37011575013943987,
"learning_rate": 2.7848887819329903e-05,
"loss": 0.1869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16166454553604126,
"step": 2060,
"valid_targets_mean": 6532.8,
"valid_targets_min": 1512
},
{
"epoch": 3.050221565731167,
"grad_norm": 0.40311646790756955,
"learning_rate": 2.7781084196027527e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19137972593307495,
"step": 2065,
"valid_targets_mean": 5962.6,
"valid_targets_min": 564
},
{
"epoch": 3.057607090103397,
"grad_norm": 0.4275359756981932,
"learning_rate": 2.7713175026839905e-05,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21499311923980713,
"step": 2070,
"valid_targets_mean": 5277.0,
"valid_targets_min": 709
},
{
"epoch": 3.064992614475628,
"grad_norm": 0.3752504219955399,
"learning_rate": 2.7645161232915444e-05,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16594503819942474,
"step": 2075,
"valid_targets_mean": 6164.9,
"valid_targets_min": 432
},
{
"epoch": 3.072378138847858,
"grad_norm": 0.4882106097565124,
"learning_rate": 2.7577043736821748e-05,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21406424045562744,
"step": 2080,
"valid_targets_mean": 4252.2,
"valid_targets_min": 625
},
{
"epoch": 3.0797636632200884,
"grad_norm": 0.3525875278030082,
"learning_rate": 2.750882346253305e-05,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13793540000915527,
"step": 2085,
"valid_targets_mean": 6917.0,
"valid_targets_min": 778
},
{
"epoch": 3.087149187592319,
"grad_norm": 0.4320447754658649,
"learning_rate": 2.7440501335417748e-05,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1812410056591034,
"step": 2090,
"valid_targets_mean": 5966.3,
"valid_targets_min": 497
},
{
"epoch": 3.0945347119645494,
"grad_norm": 0.5117110061423488,
"learning_rate": 2.7372078282225772e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2231147289276123,
"step": 2095,
"valid_targets_mean": 4128.2,
"valid_targets_min": 540
},
{
"epoch": 3.1019202363367797,
"grad_norm": 0.4095198035952486,
"learning_rate": 2.730355523107608e-05,
"loss": 0.1735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16321970522403717,
"step": 2100,
"valid_targets_mean": 5197.5,
"valid_targets_min": 461
},
{
"epoch": 3.1093057607090104,
"grad_norm": 0.47545224234959904,
"learning_rate": 2.7234933111444046e-05,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16089124977588654,
"step": 2105,
"valid_targets_mean": 3588.7,
"valid_targets_min": 322
},
{
"epoch": 3.1166912850812407,
"grad_norm": 0.3910891142579986,
"learning_rate": 2.7166212854148838e-05,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2100703865289688,
"step": 2110,
"valid_targets_mean": 6335.6,
"valid_targets_min": 708
},
{
"epoch": 3.124076809453471,
"grad_norm": 0.4204297819786424,
"learning_rate": 2.709739539134081e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17549830675125122,
"step": 2115,
"valid_targets_mean": 4854.4,
"valid_targets_min": 803
},
{
"epoch": 3.1314623338257017,
"grad_norm": 0.4084245651713014,
"learning_rate": 2.7028481656488856e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15884898602962494,
"step": 2120,
"valid_targets_mean": 4327.5,
"valid_targets_min": 546
},
{
"epoch": 3.138847858197932,
"grad_norm": 0.5289348550596176,
"learning_rate": 2.6959472584367737e-05,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18101103603839874,
"step": 2125,
"valid_targets_mean": 4410.6,
"valid_targets_min": 696
},
{
"epoch": 3.1462333825701623,
"grad_norm": 0.4419683145308729,
"learning_rate": 2.689036911104542e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24032284319400787,
"step": 2130,
"valid_targets_mean": 5461.6,
"valid_targets_min": 730
},
{
"epoch": 3.153618906942393,
"grad_norm": 0.7124574698928174,
"learning_rate": 2.6821172173870355e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15942493081092834,
"step": 2135,
"valid_targets_mean": 5982.3,
"valid_targets_min": 228
},
{
"epoch": 3.1610044313146233,
"grad_norm": 0.4691946439142087,
"learning_rate": 2.6751882711458783e-05,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16036120057106018,
"step": 2140,
"valid_targets_mean": 4745.8,
"valid_targets_min": 652
},
{
"epoch": 3.1683899556868536,
"grad_norm": 0.3657559670571617,
"learning_rate": 2.6682501663682e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16519255936145782,
"step": 2145,
"valid_targets_mean": 6309.1,
"valid_targets_min": 684
},
{
"epoch": 3.1757754800590843,
"grad_norm": 0.4525601076810765,
"learning_rate": 2.661302997165359e-05,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16392679512500763,
"step": 2150,
"valid_targets_mean": 4315.6,
"valid_targets_min": 598
},
{
"epoch": 3.1831610044313146,
"grad_norm": 0.4756846684204359,
"learning_rate": 2.6543468577716694e-05,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2014717161655426,
"step": 2155,
"valid_targets_mean": 4423.4,
"valid_targets_min": 594
},
{
"epoch": 3.1905465288035453,
"grad_norm": 0.4270410035428385,
"learning_rate": 2.6473818425431185e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1542786955833435,
"step": 2160,
"valid_targets_mean": 5105.6,
"valid_targets_min": 348
},
{
"epoch": 3.1979320531757756,
"grad_norm": 0.4702062705925336,
"learning_rate": 2.640408045956091e-05,
"loss": 0.1884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19304950535297394,
"step": 2165,
"valid_targets_mean": 4532.8,
"valid_targets_min": 674
},
{
"epoch": 3.205317577548006,
"grad_norm": 0.45151853190869246,
"learning_rate": 2.6334255626060842e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19992440938949585,
"step": 2170,
"valid_targets_mean": 4673.7,
"valid_targets_min": 658
},
{
"epoch": 3.212703101920236,
"grad_norm": 0.42434196985334355,
"learning_rate": 2.626434487206428e-05,
"loss": 0.1763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18652237951755524,
"step": 2175,
"valid_targets_mean": 5400.8,
"valid_targets_min": 528
},
{
"epoch": 3.220088626292467,
"grad_norm": 0.4063121122695259,
"learning_rate": 2.6194349145869965e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16594845056533813,
"step": 2180,
"valid_targets_mean": 5230.7,
"valid_targets_min": 369
},
{
"epoch": 3.227474150664697,
"grad_norm": 0.447772859466632,
"learning_rate": 2.6124269396929256e-05,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17529018223285675,
"step": 2185,
"valid_targets_mean": 4556.4,
"valid_targets_min": 562
},
{
"epoch": 3.234859675036928,
"grad_norm": 0.40325224428720596,
"learning_rate": 2.6054106575833206e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18165422976016998,
"step": 2190,
"valid_targets_mean": 5751.3,
"valid_targets_min": 644
},
{
"epoch": 3.242245199409158,
"grad_norm": 0.4248179861853043,
"learning_rate": 2.5983861634299715e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15987026691436768,
"step": 2195,
"valid_targets_mean": 5245.4,
"valid_targets_min": 605
},
{
"epoch": 3.2496307237813884,
"grad_norm": 0.43315325209313854,
"learning_rate": 2.5913535525160608e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19797955453395844,
"step": 2200,
"valid_targets_mean": 5092.6,
"valid_targets_min": 595
},
{
"epoch": 3.2570162481536187,
"grad_norm": 0.45899763861106463,
"learning_rate": 2.5843129202348666e-05,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1837209016084671,
"step": 2205,
"valid_targets_mean": 5431.0,
"valid_targets_min": 905
},
{
"epoch": 3.2644017725258494,
"grad_norm": 0.34185089958623904,
"learning_rate": 2.577264362088475e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12556633353233337,
"step": 2210,
"valid_targets_mean": 6299.7,
"valid_targets_min": 521
},
{
"epoch": 3.2717872968980797,
"grad_norm": 0.41205572297039716,
"learning_rate": 2.5702079736864815e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16507720947265625,
"step": 2215,
"valid_targets_mean": 5128.1,
"valid_targets_min": 821
},
{
"epoch": 3.2791728212703104,
"grad_norm": 0.3997869068309829,
"learning_rate": 2.5631438507446936e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1773259937763214,
"step": 2220,
"valid_targets_mean": 5669.0,
"valid_targets_min": 665
},
{
"epoch": 3.2865583456425407,
"grad_norm": 0.4984598466794601,
"learning_rate": 2.5560720890838332e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2146761119365692,
"step": 2225,
"valid_targets_mean": 4352.7,
"valid_targets_min": 648
},
{
"epoch": 3.293943870014771,
"grad_norm": 0.47607510524209484,
"learning_rate": 2.5489927846282386e-05,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1854625642299652,
"step": 2230,
"valid_targets_mean": 4233.4,
"valid_targets_min": 504
},
{
"epoch": 3.3013293943870012,
"grad_norm": 0.4239465864105787,
"learning_rate": 2.5419060334045606e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17958292365074158,
"step": 2235,
"valid_targets_mean": 5336.4,
"valid_targets_min": 674
},
{
"epoch": 3.308714918759232,
"grad_norm": 0.4619161542340498,
"learning_rate": 2.5348119315404604e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17576739192008972,
"step": 2240,
"valid_targets_mean": 5028.8,
"valid_targets_min": 572
},
{
"epoch": 3.3161004431314622,
"grad_norm": 0.37782695093104735,
"learning_rate": 2.5277105752633083e-05,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1741185039281845,
"step": 2245,
"valid_targets_mean": 5921.9,
"valid_targets_min": 425
},
{
"epoch": 3.323485967503693,
"grad_norm": 0.46105586751392597,
"learning_rate": 2.520602060898874e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2181580513715744,
"step": 2250,
"valid_targets_mean": 4782.2,
"valid_targets_min": 785
},
{
"epoch": 3.3308714918759232,
"grad_norm": 0.44233045621174916,
"learning_rate": 2.5134864848700247e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21820692718029022,
"step": 2255,
"valid_targets_mean": 5393.2,
"valid_targets_min": 628
},
{
"epoch": 3.3382570162481535,
"grad_norm": 0.4176926479653841,
"learning_rate": 2.5063639436954145e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2524767518043518,
"step": 2260,
"valid_targets_mean": 6778.2,
"valid_targets_min": 609
},
{
"epoch": 3.345642540620384,
"grad_norm": 0.3785623480657544,
"learning_rate": 2.499234533988174e-05,
"loss": 0.2208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15883594751358032,
"step": 2265,
"valid_targets_mean": 6011.2,
"valid_targets_min": 541
},
{
"epoch": 3.3530280649926145,
"grad_norm": 0.9489103748663574,
"learning_rate": 2.4920983524546035e-05,
"loss": 0.1826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19622023403644562,
"step": 2270,
"valid_targets_mean": 2849.2,
"valid_targets_min": 336
},
{
"epoch": 3.360413589364845,
"grad_norm": 0.4851485979634193,
"learning_rate": 2.4849554958928582e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1570294201374054,
"step": 2275,
"valid_targets_mean": 4828.0,
"valid_targets_min": 533
},
{
"epoch": 3.3677991137370755,
"grad_norm": 0.38871049650595657,
"learning_rate": 2.477806061191637e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16449853777885437,
"step": 2280,
"valid_targets_mean": 6279.4,
"valid_targets_min": 623
},
{
"epoch": 3.375184638109306,
"grad_norm": 0.3846163906395918,
"learning_rate": 2.4706501453288656e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17619986832141876,
"step": 2285,
"valid_targets_mean": 5938.9,
"valid_targets_min": 718
},
{
"epoch": 3.382570162481536,
"grad_norm": 0.4036981390266134,
"learning_rate": 2.4634878453703857e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16103024780750275,
"step": 2290,
"valid_targets_mean": 5504.4,
"valid_targets_min": 1317
},
{
"epoch": 3.389955686853767,
"grad_norm": 0.6582445011580204,
"learning_rate": 2.4563192584686325e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.192658931016922,
"step": 2295,
"valid_targets_mean": 3992.2,
"valid_targets_min": 602
},
{
"epoch": 3.397341211225997,
"grad_norm": 0.37316580719925574,
"learning_rate": 2.4491444818613218e-05,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1514277458190918,
"step": 2300,
"valid_targets_mean": 6166.7,
"valid_targets_min": 493
},
{
"epoch": 3.4047267355982274,
"grad_norm": 0.36651337529440386,
"learning_rate": 2.441963612870129e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17430251836776733,
"step": 2305,
"valid_targets_mean": 6701.6,
"valid_targets_min": 1299
},
{
"epoch": 3.412112259970458,
"grad_norm": 0.4562920402638719,
"learning_rate": 2.4347767488993697e-05,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17882443964481354,
"step": 2310,
"valid_targets_mean": 4928.1,
"valid_targets_min": 677
},
{
"epoch": 3.4194977843426884,
"grad_norm": 0.40217427857200977,
"learning_rate": 2.4275839874346757e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21625502407550812,
"step": 2315,
"valid_targets_mean": 5914.1,
"valid_targets_min": 642
},
{
"epoch": 3.4268833087149186,
"grad_norm": 0.4676729858346907,
"learning_rate": 2.4203854260416764e-05,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18612849712371826,
"step": 2320,
"valid_targets_mean": 4202.7,
"valid_targets_min": 513
},
{
"epoch": 3.4342688330871494,
"grad_norm": 0.5053850543812328,
"learning_rate": 2.4131811623646745e-05,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20099109411239624,
"step": 2325,
"valid_targets_mean": 5066.5,
"valid_targets_min": 799
},
{
"epoch": 3.4416543574593796,
"grad_norm": 0.4177536175359703,
"learning_rate": 2.4059712941253205e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17040522396564484,
"step": 2330,
"valid_targets_mean": 6019.4,
"valid_targets_min": 622
},
{
"epoch": 3.44903988183161,
"grad_norm": 0.3896994204855158,
"learning_rate": 2.3987559191212855e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17240211367607117,
"step": 2335,
"valid_targets_mean": 5771.4,
"valid_targets_min": 820
},
{
"epoch": 3.4564254062038406,
"grad_norm": 0.4519987685160109,
"learning_rate": 2.3915351352249392e-05,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.194617360830307,
"step": 2340,
"valid_targets_mean": 4527.7,
"valid_targets_min": 726
},
{
"epoch": 3.463810930576071,
"grad_norm": 0.5253399465778659,
"learning_rate": 2.3843090403820198e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16879601776599884,
"step": 2345,
"valid_targets_mean": 6142.8,
"valid_targets_min": 451
},
{
"epoch": 3.471196454948301,
"grad_norm": 0.4277432003720903,
"learning_rate": 2.3770777326103033e-05,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18401449918746948,
"step": 2350,
"valid_targets_mean": 5573.9,
"valid_targets_min": 477
},
{
"epoch": 3.478581979320532,
"grad_norm": 0.4257500742732944,
"learning_rate": 2.3698413099982772e-05,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23105338215827942,
"step": 2355,
"valid_targets_mean": 6022.1,
"valid_targets_min": 577
},
{
"epoch": 3.485967503692762,
"grad_norm": 0.35202882188870804,
"learning_rate": 2.3625998707038095e-05,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15384787321090698,
"step": 2360,
"valid_targets_mean": 6247.2,
"valid_targets_min": 743
},
{
"epoch": 3.4933530280649925,
"grad_norm": 0.5362069711243463,
"learning_rate": 2.355353512952816e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2501859962940216,
"step": 2365,
"valid_targets_mean": 3637.5,
"valid_targets_min": 557
},
{
"epoch": 3.500738552437223,
"grad_norm": 0.627740196350393,
"learning_rate": 2.3481023350379282e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1972651183605194,
"step": 2370,
"valid_targets_mean": 3431.4,
"valid_targets_min": 298
},
{
"epoch": 3.5081240768094535,
"grad_norm": 0.42738807000739665,
"learning_rate": 2.3408464353171603e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17980587482452393,
"step": 2375,
"valid_targets_mean": 4957.2,
"valid_targets_min": 606
},
{
"epoch": 3.5155096011816838,
"grad_norm": 0.4123970309337914,
"learning_rate": 2.3335859122125762e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1853245347738266,
"step": 2380,
"valid_targets_mean": 4892.4,
"valid_targets_min": 658
},
{
"epoch": 3.5228951255539145,
"grad_norm": 0.42163919981185066,
"learning_rate": 2.3263208642089517e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15585747361183167,
"step": 2385,
"valid_targets_mean": 4967.4,
"valid_targets_min": 606
},
{
"epoch": 3.5302806499261448,
"grad_norm": 0.3631774625240425,
"learning_rate": 2.319051389852441e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15152710676193237,
"step": 2390,
"valid_targets_mean": 6531.5,
"valid_targets_min": 526
},
{
"epoch": 3.537666174298375,
"grad_norm": 0.4386225168817978,
"learning_rate": 2.311777587749239e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17836642265319824,
"step": 2395,
"valid_targets_mean": 5189.2,
"valid_targets_min": 400
},
{
"epoch": 3.5450516986706058,
"grad_norm": 0.37272488284870037,
"learning_rate": 2.3044995565642453e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15524575114250183,
"step": 2400,
"valid_targets_mean": 5844.1,
"valid_targets_min": 323
},
{
"epoch": 3.552437223042836,
"grad_norm": 0.4273954739176906,
"learning_rate": 2.2972173950197223e-05,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19005119800567627,
"step": 2405,
"valid_targets_mean": 5287.6,
"valid_targets_min": 522
},
{
"epoch": 3.5598227474150663,
"grad_norm": 0.3809128573118705,
"learning_rate": 2.2899312018939598e-05,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16557791829109192,
"step": 2410,
"valid_targets_mean": 5387.4,
"valid_targets_min": 424
},
{
"epoch": 3.567208271787297,
"grad_norm": 0.445270409658121,
"learning_rate": 2.2826410760199327e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16389130055904388,
"step": 2415,
"valid_targets_mean": 6058.5,
"valid_targets_min": 699
},
{
"epoch": 3.5745937961595273,
"grad_norm": 0.7167965047318506,
"learning_rate": 2.2753471162839637e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20100605487823486,
"step": 2420,
"valid_targets_mean": 6238.5,
"valid_targets_min": 567
},
{
"epoch": 3.5819793205317576,
"grad_norm": 0.44061592794128485,
"learning_rate": 2.2680494216243762e-05,
"loss": 0.2084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20798034965991974,
"step": 2425,
"valid_targets_mean": 5419.6,
"valid_targets_min": 628
},
{
"epoch": 3.5893648449039883,
"grad_norm": 0.39676272392212464,
"learning_rate": 2.2607480910301564e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18191611766815186,
"step": 2430,
"valid_targets_mean": 6013.3,
"valid_targets_min": 704
},
{
"epoch": 3.5967503692762186,
"grad_norm": 0.38941782318875595,
"learning_rate": 2.253443223539613e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17795924842357635,
"step": 2435,
"valid_targets_mean": 5669.7,
"valid_targets_min": 647
},
{
"epoch": 3.604135893648449,
"grad_norm": 0.3942812475735809,
"learning_rate": 2.246134918239028e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1445077508687973,
"step": 2440,
"valid_targets_mean": 5918.6,
"valid_targets_min": 641
},
{
"epoch": 3.6115214180206796,
"grad_norm": 0.3878199914386221,
"learning_rate": 2.2388232742613146e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15950973331928253,
"step": 2445,
"valid_targets_mean": 5599.8,
"valid_targets_min": 462
},
{
"epoch": 3.61890694239291,
"grad_norm": 0.40119193945091164,
"learning_rate": 2.231508390784674e-05,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18693730235099792,
"step": 2450,
"valid_targets_mean": 5479.7,
"valid_targets_min": 683
},
{
"epoch": 3.62629246676514,
"grad_norm": 0.41270041132362517,
"learning_rate": 2.2241903670312516e-05,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1751289963722229,
"step": 2455,
"valid_targets_mean": 6304.4,
"valid_targets_min": 729
},
{
"epoch": 3.633677991137371,
"grad_norm": 0.37919593321209355,
"learning_rate": 2.216869302265785e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.180336594581604,
"step": 2460,
"valid_targets_mean": 6089.2,
"valid_targets_min": 683
},
{
"epoch": 3.641063515509601,
"grad_norm": 0.41713272138692914,
"learning_rate": 2.2095452957942643e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17298147082328796,
"step": 2465,
"valid_targets_mean": 5199.1,
"valid_targets_min": 547
},
{
"epoch": 3.6484490398818314,
"grad_norm": 0.5197567957007619,
"learning_rate": 2.2022184469625797e-05,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1868414729833603,
"step": 2470,
"valid_targets_mean": 4258.9,
"valid_targets_min": 620
},
{
"epoch": 3.655834564254062,
"grad_norm": 0.39404420347224917,
"learning_rate": 2.1948888551551795e-05,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16973114013671875,
"step": 2475,
"valid_targets_mean": 5702.5,
"valid_targets_min": 528
},
{
"epoch": 3.6632200886262924,
"grad_norm": 0.49672107594538334,
"learning_rate": 2.1875566197937154e-05,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22505685687065125,
"step": 2480,
"valid_targets_mean": 4229.1,
"valid_targets_min": 614
},
{
"epoch": 3.670605612998523,
"grad_norm": 0.5386862158554978,
"learning_rate": 2.1802218403357003e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18474605679512024,
"step": 2485,
"valid_targets_mean": 3811.4,
"valid_targets_min": 608
},
{
"epoch": 3.6779911373707534,
"grad_norm": 0.4199309274764877,
"learning_rate": 2.1728846162731547e-05,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16229534149169922,
"step": 2490,
"valid_targets_mean": 4422.1,
"valid_targets_min": 602
},
{
"epoch": 3.6853766617429837,
"grad_norm": 0.44213788636825774,
"learning_rate": 2.1655450471312587e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16909149289131165,
"step": 2495,
"valid_targets_mean": 4642.9,
"valid_targets_min": 670
},
{
"epoch": 3.692762186115214,
"grad_norm": 0.47756920378888834,
"learning_rate": 2.1582032324670024e-05,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21273420751094818,
"step": 2500,
"valid_targets_mean": 4483.9,
"valid_targets_min": 573
},
{
"epoch": 3.7001477104874447,
"grad_norm": 1.7776796913692625,
"learning_rate": 2.150859271867836e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20686309039592743,
"step": 2505,
"valid_targets_mean": 3814.2,
"valid_targets_min": 282
},
{
"epoch": 3.707533234859675,
"grad_norm": 0.4541222702170866,
"learning_rate": 2.143513264950316e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16933034360408783,
"step": 2510,
"valid_targets_mean": 4283.7,
"valid_targets_min": 360
},
{
"epoch": 3.7149187592319057,
"grad_norm": 0.512488878559065,
"learning_rate": 2.1361653113587583e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23736466467380524,
"step": 2515,
"valid_targets_mean": 4091.1,
"valid_targets_min": 553
},
{
"epoch": 3.722304283604136,
"grad_norm": 0.5026024047876461,
"learning_rate": 2.128815510763882e-05,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19661220908164978,
"step": 2520,
"valid_targets_mean": 3568.8,
"valid_targets_min": 479
},
{
"epoch": 3.7296898079763663,
"grad_norm": 0.4756178800621908,
"learning_rate": 2.1214639628614618e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2067551612854004,
"step": 2525,
"valid_targets_mean": 4420.6,
"valid_targets_min": 535
},
{
"epoch": 3.7370753323485966,
"grad_norm": 0.4481991423508541,
"learning_rate": 2.1141107673709727e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2029070109128952,
"step": 2530,
"valid_targets_mean": 4889.3,
"valid_targets_min": 671
},
{
"epoch": 3.7444608567208273,
"grad_norm": 0.4486218822810619,
"learning_rate": 2.1067560240342382e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19874705374240875,
"step": 2535,
"valid_targets_mean": 4725.5,
"valid_targets_min": 309
},
{
"epoch": 3.7518463810930576,
"grad_norm": 0.42580796837346163,
"learning_rate": 2.0993998326140774e-05,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17727911472320557,
"step": 2540,
"valid_targets_mean": 4696.8,
"valid_targets_min": 629
},
{
"epoch": 3.7592319054652883,
"grad_norm": 0.46276463063827256,
"learning_rate": 2.0920422928929514e-05,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21701931953430176,
"step": 2545,
"valid_targets_mean": 5121.4,
"valid_targets_min": 620
},
{
"epoch": 3.7666174298375186,
"grad_norm": 0.39520678275058635,
"learning_rate": 2.0846835046716124e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2055937796831131,
"step": 2550,
"valid_targets_mean": 6235.9,
"valid_targets_min": 743
},
{
"epoch": 3.774002954209749,
"grad_norm": 0.3749059071380504,
"learning_rate": 2.0773235677677453e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1439509242773056,
"step": 2555,
"valid_targets_mean": 5177.5,
"valid_targets_min": 601
},
{
"epoch": 3.781388478581979,
"grad_norm": 0.4376582038796636,
"learning_rate": 2.0699625820146166e-05,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19691312313079834,
"step": 2560,
"valid_targets_mean": 4715.4,
"valid_targets_min": 388
},
{
"epoch": 3.78877400295421,
"grad_norm": 0.4555515812161259,
"learning_rate": 2.0626006472597203e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2008768618106842,
"step": 2565,
"valid_targets_mean": 4623.0,
"valid_targets_min": 731
},
{
"epoch": 3.79615952732644,
"grad_norm": 0.459171004943161,
"learning_rate": 2.055237863363424e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21966755390167236,
"step": 2570,
"valid_targets_mean": 4648.9,
"valid_targets_min": 615
},
{
"epoch": 3.803545051698671,
"grad_norm": 0.4284579195415132,
"learning_rate": 2.047874330197612e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17750242352485657,
"step": 2575,
"valid_targets_mean": 5786.1,
"valid_targets_min": 697
},
{
"epoch": 3.810930576070901,
"grad_norm": 0.5052628017425496,
"learning_rate": 2.040510147644332e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1922721564769745,
"step": 2580,
"valid_targets_mean": 4639.9,
"valid_targets_min": 664
},
{
"epoch": 3.8183161004431314,
"grad_norm": 0.5209698856989999,
"learning_rate": 2.033145415594441e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1749410480260849,
"step": 2585,
"valid_targets_mean": 4522.6,
"valid_targets_min": 314
},
{
"epoch": 3.8257016248153617,
"grad_norm": 0.5289497505816443,
"learning_rate": 2.0257802339462497e-05,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2323957085609436,
"step": 2590,
"valid_targets_mean": 3958.1,
"valid_targets_min": 257
},
{
"epoch": 3.8330871491875924,
"grad_norm": 0.4429473903371753,
"learning_rate": 2.018414702604167e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17129692435264587,
"step": 2595,
"valid_targets_mean": 4951.2,
"valid_targets_min": 535
},
{
"epoch": 3.8404726735598227,
"grad_norm": 0.5664110286490077,
"learning_rate": 2.011048921477345e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19464537501335144,
"step": 2600,
"valid_targets_mean": 4107.1,
"valid_targets_min": 743
},
{
"epoch": 3.8478581979320534,
"grad_norm": 0.48372759494178025,
"learning_rate": 2.0036829904783234e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15631017088890076,
"step": 2605,
"valid_targets_mean": 5911.1,
"valid_targets_min": 535
},
{
"epoch": 3.8552437223042837,
"grad_norm": 0.5771058795231779,
"learning_rate": 1.996317009521677e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16237816214561462,
"step": 2610,
"valid_targets_mean": 4347.8,
"valid_targets_min": 565
},
{
"epoch": 3.862629246676514,
"grad_norm": 0.3451442793961211,
"learning_rate": 1.9889510785226556e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16310572624206543,
"step": 2615,
"valid_targets_mean": 6855.8,
"valid_targets_min": 537
},
{
"epoch": 3.8700147710487443,
"grad_norm": 0.47160578182778307,
"learning_rate": 1.981585297395833e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18903210759162903,
"step": 2620,
"valid_targets_mean": 4925.4,
"valid_targets_min": 490
},
{
"epoch": 3.877400295420975,
"grad_norm": 0.4112730275680861,
"learning_rate": 1.9742197660537503e-05,
"loss": 0.1801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1774231493473053,
"step": 2625,
"valid_targets_mean": 4865.4,
"valid_targets_min": 566
},
{
"epoch": 3.8847858197932053,
"grad_norm": 0.3852153308078606,
"learning_rate": 1.96685458440556e-05,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21487516164779663,
"step": 2630,
"valid_targets_mean": 6536.1,
"valid_targets_min": 666
},
{
"epoch": 3.892171344165436,
"grad_norm": 0.4266578300389501,
"learning_rate": 1.9594898523556688e-05,
"loss": 0.2017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1812269687652588,
"step": 2635,
"valid_targets_mean": 4853.8,
"valid_targets_min": 509
},
{
"epoch": 3.8995568685376663,
"grad_norm": 0.47478356489339524,
"learning_rate": 1.952125669802389e-05,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1804153323173523,
"step": 2640,
"valid_targets_mean": 4120.0,
"valid_targets_min": 229
},
{
"epoch": 3.9069423929098965,
"grad_norm": 0.3984291783021106,
"learning_rate": 1.944762136636577e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14626066386699677,
"step": 2645,
"valid_targets_mean": 5470.4,
"valid_targets_min": 482
},
{
"epoch": 3.914327917282127,
"grad_norm": 0.4145840145456443,
"learning_rate": 1.9373993527402803e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17797842621803284,
"step": 2650,
"valid_targets_mean": 5413.2,
"valid_targets_min": 524
},
{
"epoch": 3.9217134416543575,
"grad_norm": 0.43768905570389377,
"learning_rate": 1.930037417985384e-05,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1793164610862732,
"step": 2655,
"valid_targets_mean": 4557.5,
"valid_targets_min": 563
},
{
"epoch": 3.929098966026588,
"grad_norm": 0.4471133890380236,
"learning_rate": 1.9226764322322554e-05,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21864616870880127,
"step": 2660,
"valid_targets_mean": 5254.9,
"valid_targets_min": 788
},
{
"epoch": 3.9364844903988185,
"grad_norm": 0.4345555815624583,
"learning_rate": 1.915316495328388e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18304719030857086,
"step": 2665,
"valid_targets_mean": 4897.6,
"valid_targets_min": 530
},
{
"epoch": 3.943870014771049,
"grad_norm": 0.46340151961537496,
"learning_rate": 1.9079577071070486e-05,
"loss": 0.1697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1812700629234314,
"step": 2670,
"valid_targets_mean": 4532.0,
"valid_targets_min": 570
},
{
"epoch": 3.951255539143279,
"grad_norm": 0.46722063462251806,
"learning_rate": 1.9006001673859236e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18102481961250305,
"step": 2675,
"valid_targets_mean": 4135.3,
"valid_targets_min": 531
},
{
"epoch": 3.9586410635155094,
"grad_norm": 0.46809132826813665,
"learning_rate": 1.8932439759657628e-05,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2036694884300232,
"step": 2680,
"valid_targets_mean": 4903.4,
"valid_targets_min": 455
},
{
"epoch": 3.96602658788774,
"grad_norm": 0.4224456008680522,
"learning_rate": 1.8858892326290283e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20503783226013184,
"step": 2685,
"valid_targets_mean": 4960.2,
"valid_targets_min": 563
},
{
"epoch": 3.9734121122599704,
"grad_norm": 0.3976755577199375,
"learning_rate": 1.878536037138539e-05,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16833657026290894,
"step": 2690,
"valid_targets_mean": 5052.5,
"valid_targets_min": 660
},
{
"epoch": 3.980797636632201,
"grad_norm": 0.4015922991970415,
"learning_rate": 1.8711844892361187e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17497824132442474,
"step": 2695,
"valid_targets_mean": 6211.0,
"valid_targets_min": 703
},
{
"epoch": 3.9881831610044314,
"grad_norm": 0.46100259598039117,
"learning_rate": 1.8638346886412427e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17598775029182434,
"step": 2700,
"valid_targets_mean": 4511.3,
"valid_targets_min": 677
},
{
"epoch": 3.9955686853766617,
"grad_norm": 0.5263845759468841,
"learning_rate": 1.8564867350496845e-05,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1905372142791748,
"step": 2705,
"valid_targets_mean": 3814.4,
"valid_targets_min": 561
},
{
"epoch": 4.002954209748892,
"grad_norm": 0.34980228182591305,
"learning_rate": 1.8491407281321647e-05,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14900560677051544,
"step": 2710,
"valid_targets_mean": 6249.2,
"valid_targets_min": 320
},
{
"epoch": 4.010339734121122,
"grad_norm": 0.5143265300926454,
"learning_rate": 1.8417967675329975e-05,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17539595067501068,
"step": 2715,
"valid_targets_mean": 3539.0,
"valid_targets_min": 433
},
{
"epoch": 4.017725258493353,
"grad_norm": 0.3935516918907612,
"learning_rate": 1.8344549528687423e-05,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18661487102508545,
"step": 2720,
"valid_targets_mean": 6973.4,
"valid_targets_min": 441
},
{
"epoch": 4.025110782865584,
"grad_norm": 0.44755179204475903,
"learning_rate": 1.8271153837268464e-05,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15159180760383606,
"step": 2725,
"valid_targets_mean": 4417.1,
"valid_targets_min": 673
},
{
"epoch": 4.032496307237814,
"grad_norm": 0.42283273517778147,
"learning_rate": 1.8197781596643e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18647818267345428,
"step": 2730,
"valid_targets_mean": 5626.2,
"valid_targets_min": 648
},
{
"epoch": 4.039881831610044,
"grad_norm": 0.39804774495793865,
"learning_rate": 1.812443380206285e-05,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13898664712905884,
"step": 2735,
"valid_targets_mean": 5607.3,
"valid_targets_min": 827
},
{
"epoch": 4.0472673559822745,
"grad_norm": 0.4952592545309753,
"learning_rate": 1.805111144844821e-05,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17651236057281494,
"step": 2740,
"valid_targets_mean": 4273.1,
"valid_targets_min": 564
},
{
"epoch": 4.054652880354505,
"grad_norm": 0.5267789359486101,
"learning_rate": 1.7977815530374207e-05,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16626033186912537,
"step": 2745,
"valid_targets_mean": 3623.0,
"valid_targets_min": 125
},
{
"epoch": 4.062038404726736,
"grad_norm": 0.5196745978105738,
"learning_rate": 1.7904547042057364e-05,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16587507724761963,
"step": 2750,
"valid_targets_mean": 4396.9,
"valid_targets_min": 466
},
{
"epoch": 4.069423929098966,
"grad_norm": 0.4220475584040045,
"learning_rate": 1.7831306977342152e-05,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14500692486763,
"step": 2755,
"valid_targets_mean": 4850.2,
"valid_targets_min": 524
},
{
"epoch": 4.0768094534711965,
"grad_norm": 0.42814857370303006,
"learning_rate": 1.7758096329687488e-05,
"loss": 0.1562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13999520242214203,
"step": 2760,
"valid_targets_mean": 5521.1,
"valid_targets_min": 606
},
{
"epoch": 4.084194977843427,
"grad_norm": 0.3859057452591373,
"learning_rate": 1.7684916092153262e-05,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14261415600776672,
"step": 2765,
"valid_targets_mean": 5565.9,
"valid_targets_min": 672
},
{
"epoch": 4.091580502215657,
"grad_norm": 0.42241050834024985,
"learning_rate": 1.7611767257386864e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1470344364643097,
"step": 2770,
"valid_targets_mean": 5220.9,
"valid_targets_min": 674
},
{
"epoch": 4.098966026587887,
"grad_norm": 0.416789874748107,
"learning_rate": 1.753865081760973e-05,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17493118345737457,
"step": 2775,
"valid_targets_mean": 5951.9,
"valid_targets_min": 606
},
{
"epoch": 4.1063515509601185,
"grad_norm": 0.46960220255251917,
"learning_rate": 1.7465567764603876e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17590011656284332,
"step": 2780,
"valid_targets_mean": 4606.5,
"valid_targets_min": 605
},
{
"epoch": 4.113737075332349,
"grad_norm": 0.4907659502885251,
"learning_rate": 1.739251908969844e-05,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20186254382133484,
"step": 2785,
"valid_targets_mean": 4470.1,
"valid_targets_min": 718
},
{
"epoch": 4.121122599704579,
"grad_norm": 0.3933868369919279,
"learning_rate": 1.7319505783756248e-05,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12017552554607391,
"step": 2790,
"valid_targets_mean": 6450.1,
"valid_targets_min": 476
},
{
"epoch": 4.128508124076809,
"grad_norm": 0.4949323916381371,
"learning_rate": 1.724652883716037e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15612033009529114,
"step": 2795,
"valid_targets_mean": 4150.4,
"valid_targets_min": 518
},
{
"epoch": 4.13589364844904,
"grad_norm": 0.40509378331922025,
"learning_rate": 1.7173589239800673e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22377564013004303,
"step": 2800,
"valid_targets_mean": 6398.9,
"valid_targets_min": 838
},
{
"epoch": 4.14327917282127,
"grad_norm": 0.4108689853913775,
"learning_rate": 1.7100687981060405e-05,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1769275963306427,
"step": 2805,
"valid_targets_mean": 6090.0,
"valid_targets_min": 1026
},
{
"epoch": 4.150664697193501,
"grad_norm": 0.5162692493811,
"learning_rate": 1.7027826049802787e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1626986861228943,
"step": 2810,
"valid_targets_mean": 3471.9,
"valid_targets_min": 454
},
{
"epoch": 4.158050221565731,
"grad_norm": 0.5312767885071268,
"learning_rate": 1.6955004434357557e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20601385831832886,
"step": 2815,
"valid_targets_mean": 4762.1,
"valid_targets_min": 355
},
{
"epoch": 4.165435745937962,
"grad_norm": 0.4235145894913193,
"learning_rate": 1.6882224122507617e-05,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1396898776292801,
"step": 2820,
"valid_targets_mean": 5606.3,
"valid_targets_min": 456
},
{
"epoch": 4.172821270310192,
"grad_norm": 0.416756640748203,
"learning_rate": 1.6809486101475595e-05,
"loss": 0.1631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21778830885887146,
"step": 2825,
"valid_targets_mean": 7377.4,
"valid_targets_min": 657
},
{
"epoch": 4.180206794682422,
"grad_norm": 0.5252822718202776,
"learning_rate": 1.673679135791049e-05,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19100016355514526,
"step": 2830,
"valid_targets_mean": 4078.6,
"valid_targets_min": 584
},
{
"epoch": 4.1875923190546525,
"grad_norm": 0.529831098741841,
"learning_rate": 1.6664140877874245e-05,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18276384472846985,
"step": 2835,
"valid_targets_mean": 3844.6,
"valid_targets_min": 532
},
{
"epoch": 4.194977843426884,
"grad_norm": 0.3492533131434477,
"learning_rate": 1.65915356468284e-05,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11477085202932358,
"step": 2840,
"valid_targets_mean": 7473.1,
"valid_targets_min": 829
},
{
"epoch": 4.202363367799114,
"grad_norm": 0.46188579373201377,
"learning_rate": 1.651897664962072e-05,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15958110988140106,
"step": 2845,
"valid_targets_mean": 4629.6,
"valid_targets_min": 477
},
{
"epoch": 4.209748892171344,
"grad_norm": 0.36990404396979687,
"learning_rate": 1.644646487047184e-05,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1521548181772232,
"step": 2850,
"valid_targets_mean": 7015.2,
"valid_targets_min": 861
},
{
"epoch": 4.2171344165435745,
"grad_norm": 0.4062689203699344,
"learning_rate": 1.6374001292961915e-05,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1495155543088913,
"step": 2855,
"valid_targets_mean": 5666.6,
"valid_targets_min": 760
},
{
"epoch": 4.224519940915805,
"grad_norm": 0.4252533883734268,
"learning_rate": 1.630158690001723e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17348308861255646,
"step": 2860,
"valid_targets_mean": 5389.8,
"valid_targets_min": 461
},
{
"epoch": 4.231905465288035,
"grad_norm": 0.44977416984855956,
"learning_rate": 1.6229222673896977e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19169771671295166,
"step": 2865,
"valid_targets_mean": 6240.2,
"valid_targets_min": 648
},
{
"epoch": 4.239290989660266,
"grad_norm": 0.517268002202166,
"learning_rate": 1.615690959617981e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1724705845117569,
"step": 2870,
"valid_targets_mean": 4480.9,
"valid_targets_min": 546
},
{
"epoch": 4.2466765140324965,
"grad_norm": 0.5034227859483678,
"learning_rate": 1.608464864775061e-05,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15206247568130493,
"step": 2875,
"valid_targets_mean": 5756.9,
"valid_targets_min": 883
},
{
"epoch": 4.254062038404727,
"grad_norm": 0.3934998046892,
"learning_rate": 1.601244080878715e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1561555415391922,
"step": 2880,
"valid_targets_mean": 7151.8,
"valid_targets_min": 637
},
{
"epoch": 4.261447562776957,
"grad_norm": 0.4021841720607587,
"learning_rate": 1.5940287058746805e-05,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14158207178115845,
"step": 2885,
"valid_targets_mean": 4988.3,
"valid_targets_min": 691
},
{
"epoch": 4.268833087149187,
"grad_norm": 0.6182741776921272,
"learning_rate": 1.5868188376353258e-05,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1992129683494568,
"step": 2890,
"valid_targets_mean": 5678.7,
"valid_targets_min": 778
},
{
"epoch": 4.2762186115214185,
"grad_norm": 0.4614176577748903,
"learning_rate": 1.579614573958324e-05,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17441459000110626,
"step": 2895,
"valid_targets_mean": 5331.5,
"valid_targets_min": 324
},
{
"epoch": 4.283604135893649,
"grad_norm": 0.5039839970397774,
"learning_rate": 1.5724160125653253e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18613968789577484,
"step": 2900,
"valid_targets_mean": 4360.8,
"valid_targets_min": 575
},
{
"epoch": 4.290989660265879,
"grad_norm": 0.56591190309574,
"learning_rate": 1.5652232511006313e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21027769148349762,
"step": 2905,
"valid_targets_mean": 3856.9,
"valid_targets_min": 362
},
{
"epoch": 4.298375184638109,
"grad_norm": 0.5045039977125617,
"learning_rate": 1.5580363871298713e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15514475107192993,
"step": 2910,
"valid_targets_mean": 4200.1,
"valid_targets_min": 425
},
{
"epoch": 4.30576070901034,
"grad_norm": 0.5630509270539151,
"learning_rate": 1.550855518138679e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2181616574525833,
"step": 2915,
"valid_targets_mean": 3684.9,
"valid_targets_min": 668
},
{
"epoch": 4.31314623338257,
"grad_norm": 0.50018909523244,
"learning_rate": 1.543680741531368e-05,
"loss": 0.1833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1719134896993637,
"step": 2920,
"valid_targets_mean": 4710.3,
"valid_targets_min": 575
},
{
"epoch": 4.3205317577548,
"grad_norm": 0.446233266875378,
"learning_rate": 1.536512154629615e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15354609489440918,
"step": 2925,
"valid_targets_mean": 4676.2,
"valid_targets_min": 538
},
{
"epoch": 4.327917282127031,
"grad_norm": 0.4418361621253541,
"learning_rate": 1.5293498546711347e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21994024515151978,
"step": 2930,
"valid_targets_mean": 5910.9,
"valid_targets_min": 541
},
{
"epoch": 4.335302806499262,
"grad_norm": 0.43246616750276806,
"learning_rate": 1.5221939388083638e-05,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14813780784606934,
"step": 2935,
"valid_targets_mean": 5155.4,
"valid_targets_min": 608
},
{
"epoch": 4.342688330871492,
"grad_norm": 0.5184902584890491,
"learning_rate": 1.5150445041071418e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18272896111011505,
"step": 2940,
"valid_targets_mean": 3901.2,
"valid_targets_min": 708
},
{
"epoch": 4.350073855243722,
"grad_norm": 0.46142756709679333,
"learning_rate": 1.5079016475453974e-05,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15337729454040527,
"step": 2945,
"valid_targets_mean": 4455.8,
"valid_targets_min": 477
},
{
"epoch": 4.357459379615952,
"grad_norm": 0.4202013962683297,
"learning_rate": 1.500765466011827e-05,
"loss": 0.1425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14253225922584534,
"step": 2950,
"valid_targets_mean": 5328.2,
"valid_targets_min": 747
},
{
"epoch": 4.364844903988184,
"grad_norm": 0.4223795000780752,
"learning_rate": 1.4936360563045863e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1546299159526825,
"step": 2955,
"valid_targets_mean": 4801.2,
"valid_targets_min": 228
},
{
"epoch": 4.372230428360414,
"grad_norm": 0.5947413428907822,
"learning_rate": 1.4865135151299756e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18521949648857117,
"step": 2960,
"valid_targets_mean": 3601.5,
"valid_targets_min": 481
},
{
"epoch": 4.379615952732644,
"grad_norm": 0.4824214614001069,
"learning_rate": 1.4793979391011264e-05,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1658276468515396,
"step": 2965,
"valid_targets_mean": 4537.8,
"valid_targets_min": 596
},
{
"epoch": 4.387001477104874,
"grad_norm": 0.4535168608231596,
"learning_rate": 1.4722894247366925e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17292077839374542,
"step": 2970,
"valid_targets_mean": 4852.9,
"valid_targets_min": 215
},
{
"epoch": 4.394387001477105,
"grad_norm": 0.43921335228854064,
"learning_rate": 1.4651880684595394e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18284352123737335,
"step": 2975,
"valid_targets_mean": 5821.1,
"valid_targets_min": 552
},
{
"epoch": 4.401772525849335,
"grad_norm": 0.47059015487422473,
"learning_rate": 1.4580939665954396e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1612253487110138,
"step": 2980,
"valid_targets_mean": 4167.0,
"valid_targets_min": 686
},
{
"epoch": 4.409158050221565,
"grad_norm": 0.6361271510225736,
"learning_rate": 1.4510072153717613e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17631939053535461,
"step": 2985,
"valid_targets_mean": 3730.2,
"valid_targets_min": 626
},
{
"epoch": 4.416543574593796,
"grad_norm": 0.4847929947491163,
"learning_rate": 1.4439279109161673e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16035814583301544,
"step": 2990,
"valid_targets_mean": 4219.9,
"valid_targets_min": 652
},
{
"epoch": 4.423929098966027,
"grad_norm": 0.4246728217669771,
"learning_rate": 1.4368561492553074e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19435647130012512,
"step": 2995,
"valid_targets_mean": 5936.1,
"valid_targets_min": 615
},
{
"epoch": 4.431314623338257,
"grad_norm": 0.5841115607984504,
"learning_rate": 1.4297920263135194e-05,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18300238251686096,
"step": 3000,
"valid_targets_mean": 3174.0,
"valid_targets_min": 355
},
{
"epoch": 4.438700147710487,
"grad_norm": 0.44672860156890554,
"learning_rate": 1.4227356379115256e-05,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18793809413909912,
"step": 3005,
"valid_targets_mean": 5597.8,
"valid_targets_min": 879
},
{
"epoch": 4.4460856720827175,
"grad_norm": 0.38476310411513204,
"learning_rate": 1.4156870797651343e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1833447515964508,
"step": 3010,
"valid_targets_mean": 6966.1,
"valid_targets_min": 506
},
{
"epoch": 4.453471196454949,
"grad_norm": 0.42279572173644614,
"learning_rate": 1.4086464474839399e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1899091899394989,
"step": 3015,
"valid_targets_mean": 5839.3,
"valid_targets_min": 816
},
{
"epoch": 4.460856720827179,
"grad_norm": 0.44031418366204805,
"learning_rate": 1.4016138365700283e-05,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17797401547431946,
"step": 3020,
"valid_targets_mean": 6834.4,
"valid_targets_min": 628
},
{
"epoch": 4.468242245199409,
"grad_norm": 0.48920064870797775,
"learning_rate": 1.3945893424166799e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18216978013515472,
"step": 3025,
"valid_targets_mean": 4377.6,
"valid_targets_min": 573
},
{
"epoch": 4.4756277695716395,
"grad_norm": 0.4860440678191081,
"learning_rate": 1.3875730603070755e-05,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17842218279838562,
"step": 3030,
"valid_targets_mean": 4298.3,
"valid_targets_min": 519
},
{
"epoch": 4.48301329394387,
"grad_norm": 0.5122645397551936,
"learning_rate": 1.3805650854130042e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16408318281173706,
"step": 3035,
"valid_targets_mean": 5356.2,
"valid_targets_min": 612
},
{
"epoch": 4.4903988183161,
"grad_norm": 0.5777970599819502,
"learning_rate": 1.3735655127935727e-05,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18035376071929932,
"step": 3040,
"valid_targets_mean": 3534.7,
"valid_targets_min": 510
},
{
"epoch": 4.497784342688331,
"grad_norm": 0.40634258250665284,
"learning_rate": 1.3665744373939165e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1392553746700287,
"step": 3045,
"valid_targets_mean": 6123.2,
"valid_targets_min": 768
},
{
"epoch": 4.5051698670605616,
"grad_norm": 0.4222640132338195,
"learning_rate": 1.3595919540439098e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15259933471679688,
"step": 3050,
"valid_targets_mean": 4889.3,
"valid_targets_min": 475
},
{
"epoch": 4.512555391432792,
"grad_norm": 0.42710032158994776,
"learning_rate": 1.352618157456882e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1755707710981369,
"step": 3055,
"valid_targets_mean": 5323.7,
"valid_targets_min": 573
},
{
"epoch": 4.519940915805022,
"grad_norm": 0.4546554151450125,
"learning_rate": 1.3456531422283314e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16564080119132996,
"step": 3060,
"valid_targets_mean": 5748.6,
"valid_targets_min": 635
},
{
"epoch": 4.527326440177252,
"grad_norm": 0.3920659302495498,
"learning_rate": 1.3386970028346414e-05,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14143362641334534,
"step": 3065,
"valid_targets_mean": 6217.1,
"valid_targets_min": 637
},
{
"epoch": 4.534711964549483,
"grad_norm": 0.6631096404799323,
"learning_rate": 1.3317498336318001e-05,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14858531951904297,
"step": 3070,
"valid_targets_mean": 5357.5,
"valid_targets_min": 802
},
{
"epoch": 4.542097488921714,
"grad_norm": 0.36924744404698256,
"learning_rate": 1.3248117288541224e-05,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15762075781822205,
"step": 3075,
"valid_targets_mean": 6748.7,
"valid_targets_min": 1209
},
{
"epoch": 4.549483013293944,
"grad_norm": 0.4132566623757397,
"learning_rate": 1.3178827826129653e-05,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15297694504261017,
"step": 3080,
"valid_targets_mean": 5218.4,
"valid_targets_min": 629
},
{
"epoch": 4.556868537666174,
"grad_norm": 0.6105683360071116,
"learning_rate": 1.3109630888954586e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18115362524986267,
"step": 3085,
"valid_targets_mean": 2799.2,
"valid_targets_min": 518
},
{
"epoch": 4.564254062038405,
"grad_norm": 0.4312209357104268,
"learning_rate": 1.3040527415632264e-05,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13422748446464539,
"step": 3090,
"valid_targets_mean": 5207.3,
"valid_targets_min": 750
},
{
"epoch": 4.571639586410635,
"grad_norm": 0.5345112264129266,
"learning_rate": 1.297151834351115e-05,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2037266194820404,
"step": 3095,
"valid_targets_mean": 4426.9,
"valid_targets_min": 584
},
{
"epoch": 4.579025110782865,
"grad_norm": 0.48644514959603063,
"learning_rate": 1.2902604608659195e-05,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19521738588809967,
"step": 3100,
"valid_targets_mean": 4656.5,
"valid_targets_min": 536
},
{
"epoch": 4.586410635155096,
"grad_norm": 0.4686584623782236,
"learning_rate": 1.2833787145851164e-05,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16689223051071167,
"step": 3105,
"valid_targets_mean": 4490.6,
"valid_targets_min": 675
},
{
"epoch": 4.593796159527327,
"grad_norm": 0.4343439566599933,
"learning_rate": 1.2765066888555957e-05,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19107720255851746,
"step": 3110,
"valid_targets_mean": 5998.3,
"valid_targets_min": 735
},
{
"epoch": 4.601181683899557,
"grad_norm": 0.48092468519713316,
"learning_rate": 1.2696444768923919e-05,
"loss": 0.1721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18640181422233582,
"step": 3115,
"valid_targets_mean": 4409.0,
"valid_targets_min": 492
},
{
"epoch": 4.608567208271787,
"grad_norm": 0.3949210579717376,
"learning_rate": 1.2627921717774236e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16668841242790222,
"step": 3120,
"valid_targets_mean": 6662.4,
"valid_targets_min": 375
},
{
"epoch": 4.6159527326440175,
"grad_norm": 0.3653101251021582,
"learning_rate": 1.2559498664582259e-05,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17200833559036255,
"step": 3125,
"valid_targets_mean": 7024.5,
"valid_targets_min": 691
},
{
"epoch": 4.623338257016248,
"grad_norm": 0.5353189616488072,
"learning_rate": 1.2491176537466951e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18706795573234558,
"step": 3130,
"valid_targets_mean": 3664.9,
"valid_targets_min": 553
},
{
"epoch": 4.630723781388479,
"grad_norm": 0.48483146785334685,
"learning_rate": 1.242295626317826e-05,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18977820873260498,
"step": 3135,
"valid_targets_mean": 4671.8,
"valid_targets_min": 541
},
{
"epoch": 4.638109305760709,
"grad_norm": 0.4576012336580824,
"learning_rate": 1.2354838767084563e-05,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1621273159980774,
"step": 3140,
"valid_targets_mean": 4912.6,
"valid_targets_min": 547
},
{
"epoch": 4.6454948301329395,
"grad_norm": 0.47408165212071834,
"learning_rate": 1.2286824973160103e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14935819804668427,
"step": 3145,
"valid_targets_mean": 4476.2,
"valid_targets_min": 654
},
{
"epoch": 4.65288035450517,
"grad_norm": 0.35823980053826326,
"learning_rate": 1.2218915803972478e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15744267404079437,
"step": 3150,
"valid_targets_mean": 6967.7,
"valid_targets_min": 639
},
{
"epoch": 4.6602658788774,
"grad_norm": 0.3938649437885737,
"learning_rate": 1.2151112180670097e-05,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15055982768535614,
"step": 3155,
"valid_targets_mean": 6357.4,
"valid_targets_min": 2129
},
{
"epoch": 4.66765140324963,
"grad_norm": 0.4159919225396087,
"learning_rate": 1.2083415022969712e-05,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1428435891866684,
"step": 3160,
"valid_targets_mean": 5190.1,
"valid_targets_min": 589
},
{
"epoch": 4.6750369276218615,
"grad_norm": 0.321718436567835,
"learning_rate": 1.2015825249143926e-05,
"loss": 0.1475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11123082041740417,
"step": 3165,
"valid_targets_mean": 6443.4,
"valid_targets_min": 550
},
{
"epoch": 4.682422451994092,
"grad_norm": 0.5181376093279889,
"learning_rate": 1.1948343776008738e-05,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18044036626815796,
"step": 3170,
"valid_targets_mean": 5152.0,
"valid_targets_min": 476
},
{
"epoch": 4.689807976366322,
"grad_norm": 0.3835319842919287,
"learning_rate": 1.1880971518911112e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1430322527885437,
"step": 3175,
"valid_targets_mean": 5503.8,
"valid_targets_min": 599
},
{
"epoch": 4.697193500738552,
"grad_norm": 0.38392579284693557,
"learning_rate": 1.1813709391716568e-05,
"loss": 0.162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14627256989479065,
"step": 3180,
"valid_targets_mean": 6006.3,
"valid_targets_min": 649
},
{
"epoch": 4.704579025110783,
"grad_norm": 0.4621220677999244,
"learning_rate": 1.1746558306796776e-05,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17970584332942963,
"step": 3185,
"valid_targets_mean": 4955.9,
"valid_targets_min": 676
},
{
"epoch": 4.711964549483013,
"grad_norm": 0.4500367333603124,
"learning_rate": 1.1679519175017174e-05,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14992380142211914,
"step": 3190,
"valid_targets_mean": 4324.4,
"valid_targets_min": 615
},
{
"epoch": 4.719350073855244,
"grad_norm": 0.4306455292259303,
"learning_rate": 1.161259290572462e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1760706901550293,
"step": 3195,
"valid_targets_mean": 5846.6,
"valid_targets_min": 714
},
{
"epoch": 4.726735598227474,
"grad_norm": 0.5361598584911511,
"learning_rate": 1.1545780406735081e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16949506103992462,
"step": 3200,
"valid_targets_mean": 3808.7,
"valid_targets_min": 608
},
{
"epoch": 4.734121122599705,
"grad_norm": 0.4278388705938128,
"learning_rate": 1.1479082584321265e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16112419962882996,
"step": 3205,
"valid_targets_mean": 5402.7,
"valid_targets_min": 614
},
{
"epoch": 4.741506646971935,
"grad_norm": 0.4272816557388593,
"learning_rate": 1.1412500343200384e-05,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13227397203445435,
"step": 3210,
"valid_targets_mean": 5582.8,
"valid_targets_min": 229
},
{
"epoch": 4.748892171344165,
"grad_norm": 0.47634077338014624,
"learning_rate": 1.1346034586521828e-05,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17866167426109314,
"step": 3215,
"valid_targets_mean": 4475.9,
"valid_targets_min": 595
},
{
"epoch": 4.7562776957163955,
"grad_norm": 0.4344869468282722,
"learning_rate": 1.127968621585497e-05,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15781113505363464,
"step": 3220,
"valid_targets_mean": 5149.8,
"valid_targets_min": 702
},
{
"epoch": 4.763663220088627,
"grad_norm": 0.4467123123517859,
"learning_rate": 1.1213456131176894e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13696205615997314,
"step": 3225,
"valid_targets_mean": 4635.4,
"valid_targets_min": 355
},
{
"epoch": 4.771048744460857,
"grad_norm": 0.6578561115499146,
"learning_rate": 1.1147345230860225e-05,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1457718312740326,
"step": 3230,
"valid_targets_mean": 5075.1,
"valid_targets_min": 380
},
{
"epoch": 4.778434268833087,
"grad_norm": 0.47187291081005306,
"learning_rate": 1.1081354411660899e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22649861872196198,
"step": 3235,
"valid_targets_mean": 5602.9,
"valid_targets_min": 385
},
{
"epoch": 4.7858197932053175,
"grad_norm": 0.4585294146600305,
"learning_rate": 1.1015484568706025e-05,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15446168184280396,
"step": 3240,
"valid_targets_mean": 4190.6,
"valid_targets_min": 401
},
{
"epoch": 4.793205317577548,
"grad_norm": 0.4721836321102142,
"learning_rate": 1.0949736595481748e-05,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16026848554611206,
"step": 3245,
"valid_targets_mean": 4162.0,
"valid_targets_min": 211
},
{
"epoch": 4.800590841949779,
"grad_norm": 0.5097924145730403,
"learning_rate": 1.0884111383821115e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1608010232448578,
"step": 3250,
"valid_targets_mean": 4100.3,
"valid_targets_min": 559
},
{
"epoch": 4.807976366322009,
"grad_norm": 0.5121344596400246,
"learning_rate": 1.0818609823891988e-05,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18942126631736755,
"step": 3255,
"valid_targets_mean": 4584.4,
"valid_targets_min": 529
},
{
"epoch": 4.8153618906942395,
"grad_norm": 0.39125128571958845,
"learning_rate": 1.0753232804184944e-05,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1385767161846161,
"step": 3260,
"valid_targets_mean": 5840.9,
"valid_targets_min": 696
},
{
"epoch": 4.82274741506647,
"grad_norm": 0.519147963569654,
"learning_rate": 1.0687981211501286e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13257870078086853,
"step": 3265,
"valid_targets_mean": 5252.2,
"valid_targets_min": 832
},
{
"epoch": 4.8301329394387,
"grad_norm": 0.3882601827065478,
"learning_rate": 1.0622855930940935e-05,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16074441373348236,
"step": 3270,
"valid_targets_mean": 5536.7,
"valid_targets_min": 717
},
{
"epoch": 4.83751846381093,
"grad_norm": 0.5424919781622314,
"learning_rate": 1.0557857845890486e-05,
"loss": 0.1676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19361868500709534,
"step": 3275,
"valid_targets_mean": 4543.6,
"valid_targets_min": 246
},
{
"epoch": 4.844903988183161,
"grad_norm": 0.5134917623818339,
"learning_rate": 1.049298783801118e-05,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1247122585773468,
"step": 3280,
"valid_targets_mean": 4817.4,
"valid_targets_min": 457
},
{
"epoch": 4.852289512555392,
"grad_norm": 0.4500612814479838,
"learning_rate": 1.0428246787226979e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16459113359451294,
"step": 3285,
"valid_targets_mean": 4635.2,
"valid_targets_min": 531
},
{
"epoch": 4.859675036927622,
"grad_norm": 0.4535219744538525,
"learning_rate": 1.0363635571712614e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16566744446754456,
"step": 3290,
"valid_targets_mean": 5096.8,
"valid_targets_min": 592
},
{
"epoch": 4.867060561299852,
"grad_norm": 0.46962696061070613,
"learning_rate": 1.0299155067881673e-05,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19553884863853455,
"step": 3295,
"valid_targets_mean": 5114.3,
"valid_targets_min": 562
},
{
"epoch": 4.874446085672083,
"grad_norm": 0.39252568546578387,
"learning_rate": 1.023480615037472e-05,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1575905829668045,
"step": 3300,
"valid_targets_mean": 5711.9,
"valid_targets_min": 568
},
{
"epoch": 4.881831610044313,
"grad_norm": 4.133528284855488,
"learning_rate": 1.0170589692047428e-05,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13656756281852722,
"step": 3305,
"valid_targets_mean": 4539.4,
"valid_targets_min": 494
},
{
"epoch": 4.889217134416544,
"grad_norm": 0.5686494863470835,
"learning_rate": 1.0106506563958733e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19371378421783447,
"step": 3310,
"valid_targets_mean": 3573.2,
"valid_targets_min": 430
},
{
"epoch": 4.896602658788774,
"grad_norm": 0.4402520543361477,
"learning_rate": 1.0042557635359028e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1665995717048645,
"step": 3315,
"valid_targets_mean": 5250.2,
"valid_targets_min": 495
},
{
"epoch": 4.903988183161005,
"grad_norm": 0.41299530585836114,
"learning_rate": 9.978743773678362e-06,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.173518568277359,
"step": 3320,
"valid_targets_mean": 5918.4,
"valid_targets_min": 583
},
{
"epoch": 4.911373707533235,
"grad_norm": 0.4208459436047827,
"learning_rate": 9.915065844514688e-06,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12593166530132294,
"step": 3325,
"valid_targets_mean": 5046.3,
"valid_targets_min": 298
},
{
"epoch": 4.918759231905465,
"grad_norm": 0.5089228253284505,
"learning_rate": 9.851524711622111e-06,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19019880890846252,
"step": 3330,
"valid_targets_mean": 4365.8,
"valid_targets_min": 683
},
{
"epoch": 4.926144756277695,
"grad_norm": 0.3548181182634598,
"learning_rate": 9.78812123689917e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16198115050792694,
"step": 3335,
"valid_targets_mean": 7325.5,
"valid_targets_min": 469
},
{
"epoch": 4.933530280649926,
"grad_norm": 0.4847190504144033,
"learning_rate": 9.724856280377155e-06,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19115082919597626,
"step": 3340,
"valid_targets_mean": 4280.8,
"valid_targets_min": 655
},
{
"epoch": 4.940915805022157,
"grad_norm": 0.45392216834170873,
"learning_rate": 9.661730700208434e-06,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21955522894859314,
"step": 3345,
"valid_targets_mean": 4720.2,
"valid_targets_min": 383
},
{
"epoch": 4.948301329394387,
"grad_norm": 0.38054470770168214,
"learning_rate": 9.598745352654819e-06,
"loss": 0.1718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16042864322662354,
"step": 3350,
"valid_targets_mean": 5992.3,
"valid_targets_min": 598
},
{
"epoch": 4.955686853766617,
"grad_norm": 0.4603546661973167,
"learning_rate": 9.535901092075945e-06,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17585790157318115,
"step": 3355,
"valid_targets_mean": 4433.1,
"valid_targets_min": 538
},
{
"epoch": 4.963072378138848,
"grad_norm": 0.4507007240993226,
"learning_rate": 9.473198770917686e-06,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13589590787887573,
"step": 3360,
"valid_targets_mean": 5814.6,
"valid_targets_min": 649
},
{
"epoch": 4.970457902511078,
"grad_norm": 0.42542002909001325,
"learning_rate": 9.41063923970059e-06,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16971269249916077,
"step": 3365,
"valid_targets_mean": 5632.9,
"valid_targets_min": 584
},
{
"epoch": 4.977843426883309,
"grad_norm": 0.6339824403474643,
"learning_rate": 9.348223347008342e-06,
"loss": 0.1862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1671033501625061,
"step": 3370,
"valid_targets_mean": 6262.1,
"valid_targets_min": 831
},
{
"epoch": 4.985228951255539,
"grad_norm": 0.4263518906101623,
"learning_rate": 9.285951939476256e-06,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1599881947040558,
"step": 3375,
"valid_targets_mean": 4836.1,
"valid_targets_min": 521
},
{
"epoch": 4.99261447562777,
"grad_norm": 0.4552157775554924,
"learning_rate": 9.22382586177978e-06,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17859028279781342,
"step": 3380,
"valid_targets_mean": 5123.1,
"valid_targets_min": 664
},
{
"epoch": 5.0,
"grad_norm": 0.42182388484726885,
"learning_rate": 9.161845956623072e-06,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.125313863158226,
"step": 3385,
"valid_targets_mean": 5043.0,
"valid_targets_min": 661
},
{
"epoch": 5.00738552437223,
"grad_norm": 0.4371353465408426,
"learning_rate": 9.100013064727508e-06,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19350577890872955,
"step": 3390,
"valid_targets_mean": 6081.2,
"valid_targets_min": 591
},
{
"epoch": 5.014771048744461,
"grad_norm": 0.444555503330858,
"learning_rate": 9.038328024820342e-06,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2033313512802124,
"step": 3395,
"valid_targets_mean": 5863.6,
"valid_targets_min": 499
},
{
"epoch": 5.022156573116692,
"grad_norm": 0.42165983760825365,
"learning_rate": 8.976791673623289e-06,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15845409035682678,
"step": 3400,
"valid_targets_mean": 5640.8,
"valid_targets_min": 546
},
{
"epoch": 5.029542097488922,
"grad_norm": 0.38297498375540073,
"learning_rate": 8.915404845841194e-06,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11503148823976517,
"step": 3405,
"valid_targets_mean": 7132.4,
"valid_targets_min": 592
},
{
"epoch": 5.036927621861152,
"grad_norm": 0.4953749429257958,
"learning_rate": 8.8541683741507e-06,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14602802693843842,
"step": 3410,
"valid_targets_mean": 4715.0,
"valid_targets_min": 539
},
{
"epoch": 5.044313146233383,
"grad_norm": 0.5095609371925762,
"learning_rate": 8.793083089188953e-06,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1521594226360321,
"step": 3415,
"valid_targets_mean": 4684.5,
"valid_targets_min": 555
},
{
"epoch": 5.051698670605613,
"grad_norm": 0.4523371860610417,
"learning_rate": 8.732149819542362e-06,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15225934982299805,
"step": 3420,
"valid_targets_mean": 5030.1,
"valid_targets_min": 577
},
{
"epoch": 5.059084194977843,
"grad_norm": 0.5280342375496218,
"learning_rate": 8.671369391735304e-06,
"loss": 0.1385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14403800666332245,
"step": 3425,
"valid_targets_mean": 5231.7,
"valid_targets_min": 566
},
{
"epoch": 5.066469719350074,
"grad_norm": 0.40798873184330564,
"learning_rate": 8.610742630218978e-06,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13136714696884155,
"step": 3430,
"valid_targets_mean": 6256.9,
"valid_targets_min": 613
},
{
"epoch": 5.073855243722305,
"grad_norm": 0.3861935517496378,
"learning_rate": 8.550270357360149e-06,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12466324865818024,
"step": 3435,
"valid_targets_mean": 5849.4,
"valid_targets_min": 642
},
{
"epoch": 5.081240768094535,
"grad_norm": 0.7401400100882837,
"learning_rate": 8.489953393430066e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1705418825149536,
"step": 3440,
"valid_targets_mean": 3559.2,
"valid_targets_min": 490
},
{
"epoch": 5.088626292466765,
"grad_norm": 0.5193202825498705,
"learning_rate": 8.429792556593293e-06,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22426575422286987,
"step": 3445,
"valid_targets_mean": 5109.2,
"valid_targets_min": 496
},
{
"epoch": 5.096011816838995,
"grad_norm": 0.43168022491540325,
"learning_rate": 8.36978866289661e-06,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17360247671604156,
"step": 3450,
"valid_targets_mean": 5924.7,
"valid_targets_min": 690
},
{
"epoch": 5.103397341211226,
"grad_norm": 0.5111277913511018,
"learning_rate": 8.309942526257982e-06,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14671558141708374,
"step": 3455,
"valid_targets_mean": 4076.2,
"valid_targets_min": 552
},
{
"epoch": 5.110782865583457,
"grad_norm": 0.3745220484810527,
"learning_rate": 8.250254958455466e-06,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13649728894233704,
"step": 3460,
"valid_targets_mean": 6392.8,
"valid_targets_min": 953
},
{
"epoch": 5.118168389955687,
"grad_norm": 0.41895740102958157,
"learning_rate": 8.19072676911623e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16213387250900269,
"step": 3465,
"valid_targets_mean": 5501.8,
"valid_targets_min": 563
},
{
"epoch": 5.125553914327917,
"grad_norm": 0.4621969274320497,
"learning_rate": 8.13135876570557e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1634249985218048,
"step": 3470,
"valid_targets_mean": 5318.6,
"valid_targets_min": 739
},
{
"epoch": 5.132939438700148,
"grad_norm": 0.5101384366926183,
"learning_rate": 8.072151753515963e-06,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18241387605667114,
"step": 3475,
"valid_targets_mean": 4392.2,
"valid_targets_min": 589
},
{
"epoch": 5.140324963072378,
"grad_norm": 0.435494385133351,
"learning_rate": 8.013106535656098e-06,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15624777972698212,
"step": 3480,
"valid_targets_mean": 5854.9,
"valid_targets_min": 671
},
{
"epoch": 5.147710487444608,
"grad_norm": 0.45540841610405663,
"learning_rate": 7.954223913040052e-06,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16797244548797607,
"step": 3485,
"valid_targets_mean": 6307.3,
"valid_targets_min": 650
},
{
"epoch": 5.155096011816839,
"grad_norm": 0.435797126087404,
"learning_rate": 7.895504684376387e-06,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20473451912403107,
"step": 3490,
"valid_targets_mean": 6468.6,
"valid_targets_min": 688
},
{
"epoch": 5.16248153618907,
"grad_norm": 0.4658949563928541,
"learning_rate": 7.836949646157317e-06,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23565639555454254,
"step": 3495,
"valid_targets_mean": 5807.4,
"valid_targets_min": 471
},
{
"epoch": 5.1698670605613,
"grad_norm": 0.6532185606945251,
"learning_rate": 7.778559592647903e-06,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15222051739692688,
"step": 3500,
"valid_targets_mean": 5615.7,
"valid_targets_min": 583
},
{
"epoch": 5.17725258493353,
"grad_norm": 0.37994849707269074,
"learning_rate": 7.720335315875286e-06,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11698979139328003,
"step": 3505,
"valid_targets_mean": 6916.1,
"valid_targets_min": 303
},
{
"epoch": 5.1846381093057605,
"grad_norm": 0.4867862414276969,
"learning_rate": 7.662277605617952e-06,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15551450848579407,
"step": 3510,
"valid_targets_mean": 5208.1,
"valid_targets_min": 692
},
{
"epoch": 5.192023633677991,
"grad_norm": 0.5261180668274233,
"learning_rate": 7.604387249394991e-06,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17861658334732056,
"step": 3515,
"valid_targets_mean": 4572.2,
"valid_targets_min": 643
},
{
"epoch": 5.199409158050222,
"grad_norm": 0.5013761956045906,
"learning_rate": 7.546665032455458e-06,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24076738953590393,
"step": 3520,
"valid_targets_mean": 5969.2,
"valid_targets_min": 952
},
{
"epoch": 5.206794682422452,
"grad_norm": 0.44388940849901665,
"learning_rate": 7.4891117377676555e-06,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1808503419160843,
"step": 3525,
"valid_targets_mean": 5442.9,
"valid_targets_min": 831
},
{
"epoch": 5.2141802067946825,
"grad_norm": 0.3368141280700644,
"learning_rate": 7.431728146008603e-06,
"loss": 0.1428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12330228835344315,
"step": 3530,
"valid_targets_mean": 7554.9,
"valid_targets_min": 804
},
{
"epoch": 5.221565731166913,
"grad_norm": 0.47194572305530047,
"learning_rate": 7.3745150355533665e-06,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1410825550556183,
"step": 3535,
"valid_targets_mean": 4599.2,
"valid_targets_min": 521
},
{
"epoch": 5.228951255539143,
"grad_norm": 0.4589841119409957,
"learning_rate": 7.317473182464543e-06,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14487279951572418,
"step": 3540,
"valid_targets_mean": 5436.2,
"valid_targets_min": 472
},
{
"epoch": 5.236336779911373,
"grad_norm": 0.5079352080568156,
"learning_rate": 7.260603360481719e-06,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.177564337849617,
"step": 3545,
"valid_targets_mean": 4225.0,
"valid_targets_min": 441
},
{
"epoch": 5.2437223042836045,
"grad_norm": 0.4124981604846651,
"learning_rate": 7.20390634101098e-06,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20939132571220398,
"step": 3550,
"valid_targets_mean": 7137.3,
"valid_targets_min": 425
},
{
"epoch": 5.251107828655835,
"grad_norm": 0.4748050711224649,
"learning_rate": 7.147382893114447e-06,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15160918235778809,
"step": 3555,
"valid_targets_mean": 5582.1,
"valid_targets_min": 508
},
{
"epoch": 5.258493353028065,
"grad_norm": 0.49570642663047704,
"learning_rate": 7.091033783499843e-06,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1662381887435913,
"step": 3560,
"valid_targets_mean": 4688.8,
"valid_targets_min": 412
},
{
"epoch": 5.265878877400295,
"grad_norm": 0.6444535354021959,
"learning_rate": 7.034859776510094e-06,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18472233414649963,
"step": 3565,
"valid_targets_mean": 2869.7,
"valid_targets_min": 358
},
{
"epoch": 5.273264401772526,
"grad_norm": 0.36003282906413414,
"learning_rate": 6.978861634112959e-06,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11764170229434967,
"step": 3570,
"valid_targets_mean": 7215.8,
"valid_targets_min": 714
},
{
"epoch": 5.280649926144756,
"grad_norm": 0.4363348321964383,
"learning_rate": 6.923040115890698e-06,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14421112835407257,
"step": 3575,
"valid_targets_mean": 5132.3,
"valid_targets_min": 731
},
{
"epoch": 5.288035450516987,
"grad_norm": 0.4270407605139215,
"learning_rate": 6.867395979029763e-06,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15610837936401367,
"step": 3580,
"valid_targets_mean": 5726.0,
"valid_targets_min": 524
},
{
"epoch": 5.295420974889217,
"grad_norm": 0.4372448860288484,
"learning_rate": 6.8119299783105384e-06,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1485387682914734,
"step": 3585,
"valid_targets_mean": 5501.2,
"valid_targets_min": 798
},
{
"epoch": 5.302806499261448,
"grad_norm": 0.49670165229019625,
"learning_rate": 6.756642866097087e-06,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21197667717933655,
"step": 3590,
"valid_targets_mean": 4981.1,
"valid_targets_min": 593
},
{
"epoch": 5.310192023633678,
"grad_norm": 0.4873247420128096,
"learning_rate": 6.701535392326959e-06,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14547309279441833,
"step": 3595,
"valid_targets_mean": 4563.1,
"valid_targets_min": 619
},
{
"epoch": 5.317577548005908,
"grad_norm": 0.4104843544339754,
"learning_rate": 6.646608304501008e-06,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16900783777236938,
"step": 3600,
"valid_targets_mean": 6581.2,
"valid_targets_min": 764
},
{
"epoch": 5.3249630723781385,
"grad_norm": 0.47195907463014314,
"learning_rate": 6.591862347673257e-06,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1981767863035202,
"step": 3605,
"valid_targets_mean": 4831.9,
"valid_targets_min": 710
},
{
"epoch": 5.33234859675037,
"grad_norm": 0.542224951252824,
"learning_rate": 6.537298264440813e-06,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19629326462745667,
"step": 3610,
"valid_targets_mean": 3798.4,
"valid_targets_min": 432
},
{
"epoch": 5.3397341211226,
"grad_norm": 0.35804884095064315,
"learning_rate": 6.482916794933736e-06,
"loss": 0.141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12061704695224762,
"step": 3615,
"valid_targets_mean": 6460.8,
"valid_targets_min": 638
},
{
"epoch": 5.34711964549483,
"grad_norm": 0.49330966651853386,
"learning_rate": 6.428718676805065e-06,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21051400899887085,
"step": 3620,
"valid_targets_mean": 4860.2,
"valid_targets_min": 433
},
{
"epoch": 5.3545051698670605,
"grad_norm": 0.5321457303177618,
"learning_rate": 6.374704645220775e-06,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1549859642982483,
"step": 3625,
"valid_targets_mean": 3886.5,
"valid_targets_min": 466
},
{
"epoch": 5.361890694239291,
"grad_norm": 0.39489790904559613,
"learning_rate": 6.320875432849816e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1310429573059082,
"step": 3630,
"valid_targets_mean": 7088.1,
"valid_targets_min": 584
},
{
"epoch": 5.369276218611521,
"grad_norm": 0.45105096964297986,
"learning_rate": 6.2672317698541695e-06,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1540766954421997,
"step": 3635,
"valid_targets_mean": 4639.0,
"valid_targets_min": 560
},
{
"epoch": 5.376661742983752,
"grad_norm": 0.4753836438289837,
"learning_rate": 6.213774383878945e-06,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12997017800807953,
"step": 3640,
"valid_targets_mean": 5125.3,
"valid_targets_min": 526
},
{
"epoch": 5.3840472673559825,
"grad_norm": 0.5042444574219167,
"learning_rate": 6.1605040000425285e-06,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13099181652069092,
"step": 3645,
"valid_targets_mean": 5819.9,
"valid_targets_min": 490
},
{
"epoch": 5.391432791728213,
"grad_norm": 0.3863263579045339,
"learning_rate": 6.107421340926716e-06,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16232043504714966,
"step": 3650,
"valid_targets_mean": 6967.1,
"valid_targets_min": 901
},
{
"epoch": 5.398818316100443,
"grad_norm": 0.5220422627235417,
"learning_rate": 6.054527126566933e-06,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16426241397857666,
"step": 3655,
"valid_targets_mean": 4679.2,
"valid_targets_min": 716
},
{
"epoch": 5.406203840472673,
"grad_norm": 0.4319185540338788,
"learning_rate": 6.0018220744424495e-06,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1663556545972824,
"step": 3660,
"valid_targets_mean": 6097.4,
"valid_targets_min": 602
},
{
"epoch": 5.413589364844904,
"grad_norm": 0.3956255035616646,
"learning_rate": 5.949306899466672e-06,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14825277030467987,
"step": 3665,
"valid_targets_mean": 6583.9,
"valid_targets_min": 691
},
{
"epoch": 5.420974889217135,
"grad_norm": 0.484584083668749,
"learning_rate": 5.8969823139774304e-06,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19931569695472717,
"step": 3670,
"valid_targets_mean": 4773.4,
"valid_targets_min": 597
},
{
"epoch": 5.428360413589365,
"grad_norm": 0.45434367771112616,
"learning_rate": 5.844849027727313e-06,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19150590896606445,
"step": 3675,
"valid_targets_mean": 5992.9,
"valid_targets_min": 505
},
{
"epoch": 5.435745937961595,
"grad_norm": 0.6026865956309536,
"learning_rate": 5.792907747874068e-06,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16173362731933594,
"step": 3680,
"valid_targets_mean": 4554.5,
"valid_targets_min": 573
},
{
"epoch": 5.443131462333826,
"grad_norm": 0.40334097093396654,
"learning_rate": 5.741159178970958e-06,
"loss": 0.1551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15286067128181458,
"step": 3685,
"valid_targets_mean": 6434.6,
"valid_targets_min": 894
},
{
"epoch": 5.450516986706056,
"grad_norm": 0.42746203298644087,
"learning_rate": 5.689604022957256e-06,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1851692497730255,
"step": 3690,
"valid_targets_mean": 6208.4,
"valid_targets_min": 584
},
{
"epoch": 5.457902511078286,
"grad_norm": 0.48488271400781807,
"learning_rate": 5.638242979148685e-06,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17530173063278198,
"step": 3695,
"valid_targets_mean": 4681.8,
"valid_targets_min": 369
},
{
"epoch": 5.465288035450517,
"grad_norm": 0.49213245126776284,
"learning_rate": 5.587076744227966e-06,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1436440646648407,
"step": 3700,
"valid_targets_mean": 4852.8,
"valid_targets_min": 349
},
{
"epoch": 5.472673559822748,
"grad_norm": 0.5385593413242621,
"learning_rate": 5.536106012235329e-06,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23084211349487305,
"step": 3705,
"valid_targets_mean": 5293.5,
"valid_targets_min": 733
},
{
"epoch": 5.480059084194978,
"grad_norm": 0.4064012565579344,
"learning_rate": 5.485331474559133e-06,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13796594738960266,
"step": 3710,
"valid_targets_mean": 6042.2,
"valid_targets_min": 491
},
{
"epoch": 5.487444608567208,
"grad_norm": 0.4466176384591676,
"learning_rate": 5.434753819926484e-06,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16316545009613037,
"step": 3715,
"valid_targets_mean": 4737.5,
"valid_targets_min": 662
},
{
"epoch": 5.4948301329394384,
"grad_norm": 0.48204920306109306,
"learning_rate": 5.384373734393871e-06,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12412101030349731,
"step": 3720,
"valid_targets_mean": 4247.8,
"valid_targets_min": 430
},
{
"epoch": 5.50221565731167,
"grad_norm": 0.4423331415810954,
"learning_rate": 5.334191901337875e-06,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16865645349025726,
"step": 3725,
"valid_targets_mean": 5476.6,
"valid_targets_min": 635
},
{
"epoch": 5.5096011816839,
"grad_norm": 0.4261034310873824,
"learning_rate": 5.284209001445901e-06,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1629231870174408,
"step": 3730,
"valid_targets_mean": 5663.4,
"valid_targets_min": 613
},
{
"epoch": 5.51698670605613,
"grad_norm": 0.5270843670535649,
"learning_rate": 5.234425712706938e-06,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1648382544517517,
"step": 3735,
"valid_targets_mean": 4095.7,
"valid_targets_min": 587
},
{
"epoch": 5.5243722304283605,
"grad_norm": 0.4594394151163437,
"learning_rate": 5.184842710402367e-06,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14536496996879578,
"step": 3740,
"valid_targets_mean": 5437.5,
"valid_targets_min": 734
},
{
"epoch": 5.531757754800591,
"grad_norm": 0.54902978481994,
"learning_rate": 5.135460667096806e-06,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20517590641975403,
"step": 3745,
"valid_targets_mean": 4786.9,
"valid_targets_min": 500
},
{
"epoch": 5.539143279172821,
"grad_norm": 0.45086635799096986,
"learning_rate": 5.086280252628955e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15122875571250916,
"step": 3750,
"valid_targets_mean": 4694.8,
"valid_targets_min": 309
},
{
"epoch": 5.546528803545051,
"grad_norm": 0.4417456541588059,
"learning_rate": 5.037302134102575e-06,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16173198819160461,
"step": 3755,
"valid_targets_mean": 5160.4,
"valid_targets_min": 677
},
{
"epoch": 5.5539143279172825,
"grad_norm": 0.4768321706536616,
"learning_rate": 4.988526975877374e-06,
"loss": 0.1491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14764034748077393,
"step": 3760,
"valid_targets_mean": 4331.2,
"valid_targets_min": 612
},
{
"epoch": 5.561299852289513,
"grad_norm": 0.41225383767497426,
"learning_rate": 4.939955439560031e-06,
"loss": 0.1403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12844733893871307,
"step": 3765,
"valid_targets_mean": 6010.1,
"valid_targets_min": 515
},
{
"epoch": 5.568685376661743,
"grad_norm": 0.46955403794769657,
"learning_rate": 4.891588183995206e-06,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18649445474147797,
"step": 3770,
"valid_targets_mean": 4942.9,
"valid_targets_min": 639
},
{
"epoch": 5.576070901033973,
"grad_norm": 0.3936059528169128,
"learning_rate": 4.8434258652566165e-06,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1388961225748062,
"step": 3775,
"valid_targets_mean": 5572.7,
"valid_targets_min": 635
},
{
"epoch": 5.583456425406204,
"grad_norm": 0.4122457123845285,
"learning_rate": 4.795469136638125e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14227622747421265,
"step": 3780,
"valid_targets_mean": 6029.8,
"valid_targets_min": 535
},
{
"epoch": 5.590841949778435,
"grad_norm": 0.4412352401816102,
"learning_rate": 4.747718648644884e-06,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17034125328063965,
"step": 3785,
"valid_targets_mean": 5354.1,
"valid_targets_min": 652
},
{
"epoch": 5.598227474150665,
"grad_norm": 0.5432056759362457,
"learning_rate": 4.700175048984517e-06,
"loss": 0.137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11455181241035461,
"step": 3790,
"valid_targets_mean": 4452.2,
"valid_targets_min": 513
},
{
"epoch": 5.605612998522895,
"grad_norm": 0.48873939155313356,
"learning_rate": 4.652838982558321e-06,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17513684928417206,
"step": 3795,
"valid_targets_mean": 4769.3,
"valid_targets_min": 688
},
{
"epoch": 5.612998522895126,
"grad_norm": 0.4245229968901909,
"learning_rate": 4.605711091452529e-06,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1345527321100235,
"step": 3800,
"valid_targets_mean": 4822.4,
"valid_targets_min": 320
},
{
"epoch": 5.620384047267356,
"grad_norm": 0.4483079582956929,
"learning_rate": 4.5587920149296e-06,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19811424612998962,
"step": 3805,
"valid_targets_mean": 5786.8,
"valid_targets_min": 641
},
{
"epoch": 5.627769571639586,
"grad_norm": 0.3685763809564081,
"learning_rate": 4.512082389419536e-06,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11352822184562683,
"step": 3810,
"valid_targets_mean": 6317.6,
"valid_targets_min": 610
},
{
"epoch": 5.635155096011816,
"grad_norm": 0.45195450036915635,
"learning_rate": 4.465582848511265e-06,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15802201628684998,
"step": 3815,
"valid_targets_mean": 4964.2,
"valid_targets_min": 637
},
{
"epoch": 5.642540620384048,
"grad_norm": 0.4019080742593427,
"learning_rate": 4.419294022944036e-06,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1530536711215973,
"step": 3820,
"valid_targets_mean": 6357.9,
"valid_targets_min": 669
},
{
"epoch": 5.649926144756278,
"grad_norm": 0.6283549194708017,
"learning_rate": 4.373216540598868e-06,
"loss": 0.1396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17285491526126862,
"step": 3825,
"valid_targets_mean": 3964.8,
"valid_targets_min": 375
},
{
"epoch": 5.657311669128508,
"grad_norm": 0.43312904879288805,
"learning_rate": 4.32735102649003e-06,
"loss": 0.1403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14635983109474182,
"step": 3830,
"valid_targets_mean": 6200.1,
"valid_targets_min": 656
},
{
"epoch": 5.664697193500738,
"grad_norm": 0.43595340706555863,
"learning_rate": 4.281698102756568e-06,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1400405317544937,
"step": 3835,
"valid_targets_mean": 5565.6,
"valid_targets_min": 360
},
{
"epoch": 5.672082717872969,
"grad_norm": 0.48135722402982084,
"learning_rate": 4.236258388653862e-06,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20159319043159485,
"step": 3840,
"valid_targets_mean": 5819.4,
"valid_targets_min": 835
},
{
"epoch": 5.6794682422452,
"grad_norm": 0.3965676517017414,
"learning_rate": 4.1910325005452266e-06,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1373254656791687,
"step": 3845,
"valid_targets_mean": 6392.2,
"valid_targets_min": 668
},
{
"epoch": 5.68685376661743,
"grad_norm": 0.42777121231754817,
"learning_rate": 4.146021051893554e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1447691023349762,
"step": 3850,
"valid_targets_mean": 5918.9,
"valid_targets_min": 606
},
{
"epoch": 5.69423929098966,
"grad_norm": 0.5369213979278165,
"learning_rate": 4.101224653252984e-06,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14309504628181458,
"step": 3855,
"valid_targets_mean": 4915.6,
"valid_targets_min": 710
},
{
"epoch": 5.701624815361891,
"grad_norm": 0.46685754924383494,
"learning_rate": 4.056643912260634e-06,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14844262599945068,
"step": 3860,
"valid_targets_mean": 4834.6,
"valid_targets_min": 535
},
{
"epoch": 5.709010339734121,
"grad_norm": 0.5069631731010494,
"learning_rate": 4.012279433628339e-06,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17662671208381653,
"step": 3865,
"valid_targets_mean": 4272.2,
"valid_targets_min": 427
},
{
"epoch": 5.716395864106351,
"grad_norm": 0.39028852212572046,
"learning_rate": 3.968131819134484e-06,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14806535840034485,
"step": 3870,
"valid_targets_mean": 7409.1,
"valid_targets_min": 1271
},
{
"epoch": 5.7237813884785815,
"grad_norm": 0.42390110263128356,
"learning_rate": 3.924201667615804e-06,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1607496738433838,
"step": 3875,
"valid_targets_mean": 6367.4,
"valid_targets_min": 773
},
{
"epoch": 5.731166912850813,
"grad_norm": 0.48659182537833057,
"learning_rate": 3.880489574959261e-06,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17565742135047913,
"step": 3880,
"valid_targets_mean": 4721.1,
"valid_targets_min": 679
},
{
"epoch": 5.738552437223043,
"grad_norm": 0.4685263238659188,
"learning_rate": 3.836996134093997e-06,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20819538831710815,
"step": 3885,
"valid_targets_mean": 5287.9,
"valid_targets_min": 524
},
{
"epoch": 5.745937961595273,
"grad_norm": 0.5369846316753283,
"learning_rate": 3.7937219349832633e-06,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16460327804088593,
"step": 3890,
"valid_targets_mean": 3801.6,
"valid_targets_min": 635
},
{
"epoch": 5.7533234859675035,
"grad_norm": 0.41623622826233153,
"learning_rate": 3.750667564616417e-06,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19304777681827545,
"step": 3895,
"valid_targets_mean": 6364.7,
"valid_targets_min": 471
},
{
"epoch": 5.760709010339734,
"grad_norm": 0.43621830231445924,
"learning_rate": 3.7078336070009723e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14152905344963074,
"step": 3900,
"valid_targets_mean": 6270.2,
"valid_targets_min": 298
},
{
"epoch": 5.768094534711965,
"grad_norm": 1.253010108913432,
"learning_rate": 3.665220643154681e-06,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16495048999786377,
"step": 3905,
"valid_targets_mean": 4590.6,
"valid_targets_min": 606
},
{
"epoch": 5.775480059084195,
"grad_norm": 0.46508774999134267,
"learning_rate": 3.622829251097626e-06,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14090654253959656,
"step": 3910,
"valid_targets_mean": 4980.5,
"valid_targets_min": 495
},
{
"epoch": 5.7828655834564255,
"grad_norm": 0.44297068805386,
"learning_rate": 3.5806600058444075e-06,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15334025025367737,
"step": 3915,
"valid_targets_mean": 5535.4,
"valid_targets_min": 573
},
{
"epoch": 5.790251107828656,
"grad_norm": 0.4887477567047723,
"learning_rate": 3.538713479396334e-06,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15382501482963562,
"step": 3920,
"valid_targets_mean": 4043.9,
"valid_targets_min": 553
},
{
"epoch": 5.797636632200886,
"grad_norm": 0.5918387677426872,
"learning_rate": 3.4969902407336532e-06,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1690470576286316,
"step": 3925,
"valid_targets_mean": 3391.9,
"valid_targets_min": 606
},
{
"epoch": 5.805022156573116,
"grad_norm": 0.45735044033920097,
"learning_rate": 3.455490855807855e-06,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19501203298568726,
"step": 3930,
"valid_targets_mean": 5170.4,
"valid_targets_min": 686
},
{
"epoch": 5.812407680945347,
"grad_norm": 0.42972354738525703,
"learning_rate": 3.4142158875339717e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16080421209335327,
"step": 3935,
"valid_targets_mean": 6471.1,
"valid_targets_min": 858
},
{
"epoch": 5.819793205317578,
"grad_norm": 0.4913472734202364,
"learning_rate": 3.373165895782973e-06,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15726235508918762,
"step": 3940,
"valid_targets_mean": 4487.4,
"valid_targets_min": 536
},
{
"epoch": 5.827178729689808,
"grad_norm": 0.3864919394835266,
"learning_rate": 3.332341437374138e-06,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1257772147655487,
"step": 3945,
"valid_targets_mean": 6180.5,
"valid_targets_min": 606
},
{
"epoch": 5.834564254062038,
"grad_norm": 0.4576260726948439,
"learning_rate": 3.2917430660675165e-06,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13794982433319092,
"step": 3950,
"valid_targets_mean": 5125.7,
"valid_targets_min": 562
},
{
"epoch": 5.841949778434269,
"grad_norm": 0.6723128146394246,
"learning_rate": 3.251371332556428e-06,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14654061198234558,
"step": 3955,
"valid_targets_mean": 5167.3,
"valid_targets_min": 379
},
{
"epoch": 5.849335302806499,
"grad_norm": 0.5108031470733075,
"learning_rate": 3.2112267844599686e-06,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15340697765350342,
"step": 3960,
"valid_targets_mean": 4387.8,
"valid_targets_min": 654
},
{
"epoch": 5.85672082717873,
"grad_norm": 0.557035301382823,
"learning_rate": 3.171309966315614e-06,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16433045268058777,
"step": 3965,
"valid_targets_mean": 4127.7,
"valid_targets_min": 490
},
{
"epoch": 5.86410635155096,
"grad_norm": 0.4165972177795746,
"learning_rate": 3.131621419571795e-06,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15628871321678162,
"step": 3970,
"valid_targets_mean": 5658.2,
"valid_targets_min": 563
},
{
"epoch": 5.871491875923191,
"grad_norm": 0.4450131689820263,
"learning_rate": 3.0921616825805834e-06,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15231899917125702,
"step": 3975,
"valid_targets_mean": 5490.5,
"valid_targets_min": 655
},
{
"epoch": 5.878877400295421,
"grad_norm": 0.46785664172207136,
"learning_rate": 3.0529312905903886e-06,
"loss": 0.1595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15238377451896667,
"step": 3980,
"valid_targets_mean": 4522.8,
"valid_targets_min": 504
},
{
"epoch": 5.886262924667651,
"grad_norm": 0.49684861734721625,
"learning_rate": 3.013930775738676e-06,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1534469872713089,
"step": 3985,
"valid_targets_mean": 4430.8,
"valid_targets_min": 557
},
{
"epoch": 5.8936484490398815,
"grad_norm": 0.6814697551595089,
"learning_rate": 2.975160667044763e-06,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16581161320209503,
"step": 3990,
"valid_targets_mean": 4855.6,
"valid_targets_min": 570
},
{
"epoch": 5.901033973412112,
"grad_norm": 0.42548375911231223,
"learning_rate": 2.9366214904026445e-06,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1445370763540268,
"step": 3995,
"valid_targets_mean": 5361.6,
"valid_targets_min": 679
},
{
"epoch": 5.908419497784343,
"grad_norm": 0.4413005273888539,
"learning_rate": 2.898313768573857e-06,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14729730784893036,
"step": 4000,
"valid_targets_mean": 5133.8,
"valid_targets_min": 491
},
{
"epoch": 5.915805022156573,
"grad_norm": 0.4985779399517165,
"learning_rate": 2.8602380211803815e-06,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15672720968723297,
"step": 4005,
"valid_targets_mean": 4657.6,
"valid_targets_min": 789
},
{
"epoch": 5.9231905465288035,
"grad_norm": 0.5264213368938573,
"learning_rate": 2.822394764697607e-06,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14332908391952515,
"step": 4010,
"valid_targets_mean": 4761.6,
"valid_targets_min": 289
},
{
"epoch": 5.930576070901034,
"grad_norm": 0.4744288530268933,
"learning_rate": 2.784784512447314e-06,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1922370046377182,
"step": 4015,
"valid_targets_mean": 5348.4,
"valid_targets_min": 853
},
{
"epoch": 5.937961595273264,
"grad_norm": 0.4438269690328926,
"learning_rate": 2.747407774590718e-06,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440523862838745,
"step": 4020,
"valid_targets_mean": 4801.4,
"valid_targets_min": 700
},
{
"epoch": 5.945347119645495,
"grad_norm": 0.3990012691696163,
"learning_rate": 2.7102650581215486e-06,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13657835125923157,
"step": 4025,
"valid_targets_mean": 6708.6,
"valid_targets_min": 648
},
{
"epoch": 5.9527326440177255,
"grad_norm": 0.41646211715971676,
"learning_rate": 2.673356866859167e-06,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15765783190727234,
"step": 4030,
"valid_targets_mean": 5822.4,
"valid_targets_min": 872
},
{
"epoch": 5.960118168389956,
"grad_norm": 0.4931126540910065,
"learning_rate": 2.6366837014417422e-06,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1812196969985962,
"step": 4035,
"valid_targets_mean": 5131.9,
"valid_targets_min": 714
},
{
"epoch": 5.967503692762186,
"grad_norm": 0.4482245693010152,
"learning_rate": 2.6002460593194466e-06,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14398686587810516,
"step": 4040,
"valid_targets_mean": 5426.2,
"valid_targets_min": 384
},
{
"epoch": 5.974889217134416,
"grad_norm": 0.4086296843327063,
"learning_rate": 2.5640444347477255e-06,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1505671888589859,
"step": 4045,
"valid_targets_mean": 6444.2,
"valid_targets_min": 477
},
{
"epoch": 5.982274741506647,
"grad_norm": 0.5290771022870968,
"learning_rate": 2.528079318780574e-06,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17048917710781097,
"step": 4050,
"valid_targets_mean": 3984.4,
"valid_targets_min": 495
},
{
"epoch": 5.989660265878878,
"grad_norm": 0.4256479196291018,
"learning_rate": 2.4923511992638895e-06,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14762143790721893,
"step": 4055,
"valid_targets_mean": 5162.6,
"valid_targets_min": 703
},
{
"epoch": 5.997045790251108,
"grad_norm": 0.46850279871296086,
"learning_rate": 2.4568605608288533e-06,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14865565299987793,
"step": 4060,
"valid_targets_mean": 4318.1,
"valid_targets_min": 486
},
{
"epoch": 6.004431314623338,
"grad_norm": 0.5249959190204746,
"learning_rate": 2.4216078848853506e-06,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17384469509124756,
"step": 4065,
"valid_targets_mean": 3995.9,
"valid_targets_min": 477
},
{
"epoch": 6.011816838995569,
"grad_norm": 0.5988657789473296,
"learning_rate": 2.386593649615441e-06,
"loss": 0.1573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.151736781001091,
"step": 4070,
"valid_targets_mean": 2800.8,
"valid_targets_min": 451
},
{
"epoch": 6.019202363367799,
"grad_norm": 0.39840181178979595,
"learning_rate": 2.3518183299668796e-06,
"loss": 0.138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13792383670806885,
"step": 4075,
"valid_targets_mean": 5876.8,
"valid_targets_min": 645
},
{
"epoch": 6.026587887740029,
"grad_norm": 0.44045943750338273,
"learning_rate": 2.3172823976466697e-06,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15484324097633362,
"step": 4080,
"valid_targets_mean": 5097.8,
"valid_targets_min": 771
},
{
"epoch": 6.03397341211226,
"grad_norm": 0.4629364970805179,
"learning_rate": 2.282986321114662e-06,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14461535215377808,
"step": 4085,
"valid_targets_mean": 5088.2,
"valid_targets_min": 655
},
{
"epoch": 6.041358936484491,
"grad_norm": 0.40286656062179965,
"learning_rate": 2.2489305655771987e-06,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16793042421340942,
"step": 4090,
"valid_targets_mean": 6758.6,
"valid_targets_min": 832
},
{
"epoch": 6.048744460856721,
"grad_norm": 0.4182839452913791,
"learning_rate": 2.215115592980821e-06,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14046970009803772,
"step": 4095,
"valid_targets_mean": 5969.9,
"valid_targets_min": 640
},
{
"epoch": 6.056129985228951,
"grad_norm": 0.43593965359653836,
"learning_rate": 2.1815418620059824e-06,
"loss": 0.1388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1332874596118927,
"step": 4100,
"valid_targets_mean": 5555.6,
"valid_targets_min": 476
},
{
"epoch": 6.0635155096011815,
"grad_norm": 0.46039610869991315,
"learning_rate": 2.1482098280608234e-06,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2060922533273697,
"step": 4105,
"valid_targets_mean": 5705.4,
"valid_targets_min": 614
},
{
"epoch": 6.070901033973412,
"grad_norm": 0.37373910107719843,
"learning_rate": 2.1151199432750192e-06,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1127336174249649,
"step": 4110,
"valid_targets_mean": 6756.9,
"valid_targets_min": 831
},
{
"epoch": 6.078286558345643,
"grad_norm": 0.44535195342707495,
"learning_rate": 2.082272656493625e-06,
"loss": 0.146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15034779906272888,
"step": 4115,
"valid_targets_mean": 5689.1,
"valid_targets_min": 349
},
{
"epoch": 6.085672082717873,
"grad_norm": 0.5195916162622733,
"learning_rate": 2.049668413271e-06,
"loss": 0.1573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19452224671840668,
"step": 4120,
"valid_targets_mean": 4656.3,
"valid_targets_min": 636
},
{
"epoch": 6.0930576070901035,
"grad_norm": 0.5560703022649638,
"learning_rate": 2.0173076558647487e-06,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14960438013076782,
"step": 4125,
"valid_targets_mean": 4023.4,
"valid_targets_min": 692
},
{
"epoch": 6.100443131462334,
"grad_norm": 0.4749923373792734,
"learning_rate": 1.9851908232297525e-06,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13118794560432434,
"step": 4130,
"valid_targets_mean": 4465.4,
"valid_targets_min": 326
},
{
"epoch": 6.107828655834564,
"grad_norm": 0.4829535285337888,
"learning_rate": 1.9533183510121725e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15433762967586517,
"step": 4135,
"valid_targets_mean": 5477.0,
"valid_targets_min": 621
},
{
"epoch": 6.115214180206794,
"grad_norm": 0.45301666809919827,
"learning_rate": 1.9216906715435744e-06,
"loss": 0.1414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1339162439107895,
"step": 4140,
"valid_targets_mean": 4647.9,
"valid_targets_min": 761
},
{
"epoch": 6.1225997045790255,
"grad_norm": 0.39338422495107067,
"learning_rate": 1.8903082138350548e-06,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1282079815864563,
"step": 4145,
"valid_targets_mean": 5771.3,
"valid_targets_min": 425
},
{
"epoch": 6.129985228951256,
"grad_norm": 0.44371532394815066,
"learning_rate": 1.8591714035714049e-06,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16418243944644928,
"step": 4150,
"valid_targets_mean": 5660.0,
"valid_targets_min": 479
},
{
"epoch": 6.137370753323486,
"grad_norm": 0.48563406133620735,
"learning_rate": 1.8282806631053662e-06,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16766785085201263,
"step": 4155,
"valid_targets_mean": 4655.8,
"valid_targets_min": 433
},
{
"epoch": 6.144756277695716,
"grad_norm": 0.6072416236863333,
"learning_rate": 1.7976364114518796e-06,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1494389772415161,
"step": 4160,
"valid_targets_mean": 3736.5,
"valid_targets_min": 491
},
{
"epoch": 6.152141802067947,
"grad_norm": 0.50481142735507,
"learning_rate": 1.7672390642824156e-06,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17777088284492493,
"step": 4165,
"valid_targets_mean": 4276.0,
"valid_targets_min": 666
},
{
"epoch": 6.159527326440177,
"grad_norm": 0.42071660129307986,
"learning_rate": 1.7370890339193191e-06,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1517738252878189,
"step": 4170,
"valid_targets_mean": 6217.3,
"valid_targets_min": 747
},
{
"epoch": 6.166912850812408,
"grad_norm": 0.4290485201318066,
"learning_rate": 1.7071867293302325e-06,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1593089997768402,
"step": 4175,
"valid_targets_mean": 5545.1,
"valid_targets_min": 765
},
{
"epoch": 6.174298375184638,
"grad_norm": 0.43744895390706484,
"learning_rate": 1.6775325561225409e-06,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13858440518379211,
"step": 4180,
"valid_targets_mean": 5377.1,
"valid_targets_min": 466
},
{
"epoch": 6.181683899556869,
"grad_norm": 0.4262626698684947,
"learning_rate": 1.648126916537871e-06,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14648282527923584,
"step": 4185,
"valid_targets_mean": 5709.4,
"valid_targets_min": 654
},
{
"epoch": 6.189069423929099,
"grad_norm": 0.47051468258097345,
"learning_rate": 1.6189702094466309e-06,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1473892331123352,
"step": 4190,
"valid_targets_mean": 4704.9,
"valid_targets_min": 755
},
{
"epoch": 6.196454948301329,
"grad_norm": 0.49070628134476585,
"learning_rate": 1.5900628303426114e-06,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15285709500312805,
"step": 4195,
"valid_targets_mean": 4618.8,
"valid_targets_min": 530
},
{
"epoch": 6.203840472673559,
"grad_norm": 0.4253518994986448,
"learning_rate": 1.5614051713376066e-06,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15116259455680847,
"step": 4200,
"valid_targets_mean": 5736.6,
"valid_targets_min": 412
},
{
"epoch": 6.211225997045791,
"grad_norm": 0.4641185127939372,
"learning_rate": 1.5329976211561138e-06,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20113864541053772,
"step": 4205,
"valid_targets_mean": 5099.3,
"valid_targets_min": 529
},
{
"epoch": 6.218611521418021,
"grad_norm": 0.39647752417172666,
"learning_rate": 1.504840565130039e-06,
"loss": 0.1464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13573205471038818,
"step": 4210,
"valid_targets_mean": 6350.6,
"valid_targets_min": 711
},
{
"epoch": 6.225997045790251,
"grad_norm": 0.48103069316244723,
"learning_rate": 1.4769343851934847e-06,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1464741975069046,
"step": 4215,
"valid_targets_mean": 4600.5,
"valid_targets_min": 514
},
{
"epoch": 6.233382570162481,
"grad_norm": 0.40232624403233436,
"learning_rate": 1.4492794598775661e-06,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13256195187568665,
"step": 4220,
"valid_targets_mean": 6487.2,
"valid_targets_min": 679
},
{
"epoch": 6.240768094534712,
"grad_norm": 0.5055273590949532,
"learning_rate": 1.4218761643052692e-06,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15635859966278076,
"step": 4225,
"valid_targets_mean": 4193.4,
"valid_targets_min": 721
},
{
"epoch": 6.248153618906942,
"grad_norm": 0.43866996029377286,
"learning_rate": 1.3947248701863813e-06,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16044774651527405,
"step": 4230,
"valid_targets_mean": 5434.1,
"valid_targets_min": 541
},
{
"epoch": 6.255539143279173,
"grad_norm": 0.49231511408163975,
"learning_rate": 1.3678259458124177e-06,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13283999264240265,
"step": 4235,
"valid_targets_mean": 4179.0,
"valid_targets_min": 800
},
{
"epoch": 6.262924667651403,
"grad_norm": 0.4230623819145653,
"learning_rate": 1.3411797560516627e-06,
"loss": 0.1344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1318785846233368,
"step": 4240,
"valid_targets_mean": 6249.6,
"valid_targets_min": 703
},
{
"epoch": 6.270310192023634,
"grad_norm": 0.46935895443155884,
"learning_rate": 1.314786662344194e-06,
"loss": 0.1497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17924916744232178,
"step": 4245,
"valid_targets_mean": 5661.8,
"valid_targets_min": 570
},
{
"epoch": 6.277695716395864,
"grad_norm": 0.3888317431003321,
"learning_rate": 1.2886470226969895e-06,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13889117538928986,
"step": 4250,
"valid_targets_mean": 6869.9,
"valid_targets_min": 990
},
{
"epoch": 6.285081240768094,
"grad_norm": 0.4352449485035959,
"learning_rate": 1.2627611916790715e-06,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14910173416137695,
"step": 4255,
"valid_targets_mean": 5603.9,
"valid_targets_min": 491
},
{
"epoch": 6.2924667651403245,
"grad_norm": 0.40749937475334613,
"learning_rate": 1.237129520416691e-06,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15692628920078278,
"step": 4260,
"valid_targets_mean": 6081.8,
"valid_targets_min": 831
},
{
"epoch": 6.299852289512556,
"grad_norm": 0.4037894828650866,
"learning_rate": 1.211752356588578e-06,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13675357401371002,
"step": 4265,
"valid_targets_mean": 6421.4,
"valid_targets_min": 457
},
{
"epoch": 6.307237813884786,
"grad_norm": 0.5205689683666549,
"learning_rate": 1.1866300444212108e-06,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15477876365184784,
"step": 4270,
"valid_targets_mean": 3994.2,
"valid_targets_min": 546
},
{
"epoch": 6.314623338257016,
"grad_norm": 0.5661967143739712,
"learning_rate": 1.161762924684151e-06,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15488114953041077,
"step": 4275,
"valid_targets_mean": 4311.4,
"valid_targets_min": 541
},
{
"epoch": 6.3220088626292466,
"grad_norm": 0.4837147960209401,
"learning_rate": 1.1371513346854313e-06,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16949772834777832,
"step": 4280,
"valid_targets_mean": 4836.6,
"valid_targets_min": 493
},
{
"epoch": 6.329394387001477,
"grad_norm": 0.5432762673776387,
"learning_rate": 1.1127956082669633e-06,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18372945487499237,
"step": 4285,
"valid_targets_mean": 4226.1,
"valid_targets_min": 707
},
{
"epoch": 6.336779911373707,
"grad_norm": 0.5144469478911506,
"learning_rate": 1.0886960758000265e-06,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16694745421409607,
"step": 4290,
"valid_targets_mean": 3961.9,
"valid_targets_min": 400
},
{
"epoch": 6.344165435745938,
"grad_norm": 0.43923637649600045,
"learning_rate": 1.0648530641807686e-06,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1794458031654358,
"step": 4295,
"valid_targets_mean": 5821.2,
"valid_targets_min": 526
},
{
"epoch": 6.3515509601181686,
"grad_norm": 0.5123527090839185,
"learning_rate": 1.0412668968257877e-06,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14006029069423676,
"step": 4300,
"valid_targets_mean": 4426.3,
"valid_targets_min": 781
},
{
"epoch": 6.358936484490399,
"grad_norm": 0.4115851655709371,
"learning_rate": 1.0179378936677397e-06,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1542370468378067,
"step": 4305,
"valid_targets_mean": 5933.6,
"valid_targets_min": 666
},
{
"epoch": 6.366322008862629,
"grad_norm": 0.5258862879779717,
"learning_rate": 9.948663711509954e-07,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15517973899841309,
"step": 4310,
"valid_targets_mean": 4407.2,
"valid_targets_min": 586
},
{
"epoch": 6.373707533234859,
"grad_norm": 0.44159616792495127,
"learning_rate": 9.720526422273412e-07,
"loss": 0.1512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1318591982126236,
"step": 4315,
"valid_targets_mean": 5543.4,
"valid_targets_min": 841
},
{
"epoch": 6.381093057607091,
"grad_norm": 0.49990677130913785,
"learning_rate": 9.494970163517681e-07,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15071862936019897,
"step": 4320,
"valid_targets_mean": 4528.5,
"valid_targets_min": 573
},
{
"epoch": 6.388478581979321,
"grad_norm": 0.4164585567607767,
"learning_rate": 9.2719979947822e-07,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15653051435947418,
"step": 4325,
"valid_targets_mean": 6323.8,
"valid_targets_min": 490
},
{
"epoch": 6.395864106351551,
"grad_norm": 0.5160481333349497,
"learning_rate": 9.051612940554899e-07,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1293860673904419,
"step": 4330,
"valid_targets_mean": 4956.7,
"valid_targets_min": 796
},
{
"epoch": 6.403249630723781,
"grad_norm": 0.5499032197777276,
"learning_rate": 8.833817990230953e-07,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15469960868358612,
"step": 4335,
"valid_targets_mean": 4249.5,
"valid_targets_min": 324
},
{
"epoch": 6.410635155096012,
"grad_norm": 0.40152843519987197,
"learning_rate": 8.61861609807233e-07,
"loss": 0.1432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11483586579561234,
"step": 4340,
"valid_targets_mean": 6111.3,
"valid_targets_min": 712
},
{
"epoch": 6.418020679468242,
"grad_norm": 0.42446425379167474,
"learning_rate": 8.406010183167601e-07,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1487945318222046,
"step": 4345,
"valid_targets_mean": 7079.7,
"valid_targets_min": 685
},
{
"epoch": 6.425406203840472,
"grad_norm": 0.7413738678926328,
"learning_rate": 8.196003129392438e-07,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16445940732955933,
"step": 4350,
"valid_targets_mean": 3112.4,
"valid_targets_min": 548
},
{
"epoch": 6.432791728212703,
"grad_norm": 0.44560225337100395,
"learning_rate": 7.988597785370533e-07,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12470986694097519,
"step": 4355,
"valid_targets_mean": 5328.5,
"valid_targets_min": 257
},
{
"epoch": 6.440177252584934,
"grad_norm": 0.4745632975601192,
"learning_rate": 7.783796964434831e-07,
"loss": 0.1434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16859686374664307,
"step": 4360,
"valid_targets_mean": 5014.4,
"valid_targets_min": 726
},
{
"epoch": 6.447562776957164,
"grad_norm": 0.4642679768852893,
"learning_rate": 7.581603444589447e-07,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13736671209335327,
"step": 4365,
"valid_targets_mean": 4825.1,
"valid_targets_min": 528
},
{
"epoch": 6.454948301329394,
"grad_norm": 0.4434842107811936,
"learning_rate": 7.382019968471943e-07,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14103060960769653,
"step": 4370,
"valid_targets_mean": 5577.3,
"valid_targets_min": 552
},
{
"epoch": 6.4623338257016245,
"grad_norm": 0.503057563707869,
"learning_rate": 7.185049243316222e-07,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14642839133739471,
"step": 4375,
"valid_targets_mean": 4761.9,
"valid_targets_min": 652
},
{
"epoch": 6.469719350073856,
"grad_norm": 0.6276381062918326,
"learning_rate": 6.990693940915694e-07,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24949908256530762,
"step": 4380,
"valid_targets_mean": 3993.2,
"valid_targets_min": 535
},
{
"epoch": 6.477104874446086,
"grad_norm": 0.4926903015244238,
"learning_rate": 6.798956697587079e-07,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1511232703924179,
"step": 4385,
"valid_targets_mean": 4615.3,
"valid_targets_min": 595
},
{
"epoch": 6.484490398818316,
"grad_norm": 0.49283910568013917,
"learning_rate": 6.60984011413468e-07,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16701708734035492,
"step": 4390,
"valid_targets_mean": 4338.4,
"valid_targets_min": 645
},
{
"epoch": 6.4918759231905465,
"grad_norm": 0.5002990883414868,
"learning_rate": 6.423346755815019e-07,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13407056033611298,
"step": 4395,
"valid_targets_mean": 4023.8,
"valid_targets_min": 658
},
{
"epoch": 6.499261447562777,
"grad_norm": 0.5338641891206741,
"learning_rate": 6.239479152302164e-07,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17522169649600983,
"step": 4400,
"valid_targets_mean": 4392.1,
"valid_targets_min": 670
},
{
"epoch": 6.506646971935007,
"grad_norm": 0.5484669473808206,
"learning_rate": 6.058239797653276e-07,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1687406748533249,
"step": 4405,
"valid_targets_mean": 4462.4,
"valid_targets_min": 482
},
{
"epoch": 6.514032496307237,
"grad_norm": 0.5639609310377635,
"learning_rate": 5.879631150274901e-07,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15761615335941315,
"step": 4410,
"valid_targets_mean": 4938.3,
"valid_targets_min": 271
},
{
"epoch": 6.5214180206794685,
"grad_norm": 0.4302419740392286,
"learning_rate": 5.703655632889505e-07,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12143665552139282,
"step": 4415,
"valid_targets_mean": 6462.4,
"valid_targets_min": 537
},
{
"epoch": 6.528803545051699,
"grad_norm": 0.4018145246408569,
"learning_rate": 5.530315632502725e-07,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15424439311027527,
"step": 4420,
"valid_targets_mean": 7003.6,
"valid_targets_min": 650
},
{
"epoch": 6.536189069423929,
"grad_norm": 0.4280985946691859,
"learning_rate": 5.359613500370931e-07,
"loss": 0.1626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13937228918075562,
"step": 4425,
"valid_targets_mean": 5996.9,
"valid_targets_min": 928
},
{
"epoch": 6.543574593796159,
"grad_norm": 0.512095968806376,
"learning_rate": 5.191551551969376e-07,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1761317402124405,
"step": 4430,
"valid_targets_mean": 5061.4,
"valid_targets_min": 639
},
{
"epoch": 6.55096011816839,
"grad_norm": 0.42658213407812473,
"learning_rate": 5.026132066960699e-07,
"loss": 0.1372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12839290499687195,
"step": 4435,
"valid_targets_mean": 6122.6,
"valid_targets_min": 989
},
{
"epoch": 6.558345642540621,
"grad_norm": 0.43584162901665235,
"learning_rate": 4.863357289164094e-07,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13353732228279114,
"step": 4440,
"valid_targets_mean": 5793.8,
"valid_targets_min": 774
},
{
"epoch": 6.565731166912851,
"grad_norm": 0.5121854270322571,
"learning_rate": 4.703229426524836e-07,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.140175461769104,
"step": 4445,
"valid_targets_mean": 6360.8,
"valid_targets_min": 825
},
{
"epoch": 6.573116691285081,
"grad_norm": 0.4891587376138227,
"learning_rate": 4.545750651084291e-07,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1598307192325592,
"step": 4450,
"valid_targets_mean": 5076.1,
"valid_targets_min": 641
},
{
"epoch": 6.580502215657312,
"grad_norm": 0.48474954710037227,
"learning_rate": 4.3909230989505724e-07,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15411385893821716,
"step": 4455,
"valid_targets_mean": 4396.3,
"valid_targets_min": 641
},
{
"epoch": 6.587887740029542,
"grad_norm": 0.48095262700952346,
"learning_rate": 4.2387488702693823e-07,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15224063396453857,
"step": 4460,
"valid_targets_mean": 4503.4,
"valid_targets_min": 612
},
{
"epoch": 6.595273264401772,
"grad_norm": 0.42397246226943786,
"learning_rate": 4.0892300291957674e-07,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14690491557121277,
"step": 4465,
"valid_targets_mean": 5915.6,
"valid_targets_min": 495
},
{
"epoch": 6.6026587887740025,
"grad_norm": 0.43317383963947165,
"learning_rate": 3.942368603865898e-07,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13303223252296448,
"step": 4470,
"valid_targets_mean": 5465.1,
"valid_targets_min": 1317
},
{
"epoch": 6.610044313146234,
"grad_norm": 0.4006775023374142,
"learning_rate": 3.798166586369645e-07,
"loss": 0.1374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15547743439674377,
"step": 4475,
"valid_targets_mean": 7271.6,
"valid_targets_min": 636
},
{
"epoch": 6.617429837518464,
"grad_norm": 0.4117824406720461,
"learning_rate": 3.656625932723579e-07,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13841594755649567,
"step": 4480,
"valid_targets_mean": 6281.6,
"valid_targets_min": 685
},
{
"epoch": 6.624815361890694,
"grad_norm": 0.5336042505216406,
"learning_rate": 3.5177485628444363e-07,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1793767213821411,
"step": 4485,
"valid_targets_mean": 4352.6,
"valid_targets_min": 603
},
{
"epoch": 6.6322008862629245,
"grad_norm": 0.44302761320669076,
"learning_rate": 3.381536360523008e-07,
"loss": 0.1375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14193832874298096,
"step": 4490,
"valid_targets_mean": 5695.8,
"valid_targets_min": 734
},
{
"epoch": 6.639586410635155,
"grad_norm": 0.4383730918433756,
"learning_rate": 3.247991173398668e-07,
"loss": 0.1321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1333121955394745,
"step": 4495,
"valid_targets_mean": 5675.1,
"valid_targets_min": 622
},
{
"epoch": 6.646971935007386,
"grad_norm": 0.5170425717885939,
"learning_rate": 3.117114812934263e-07,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1605900526046753,
"step": 4500,
"valid_targets_mean": 4572.1,
"valid_targets_min": 575
},
{
"epoch": 6.654357459379616,
"grad_norm": 0.48806033544384714,
"learning_rate": 2.988909054391598e-07,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1332065463066101,
"step": 4505,
"valid_targets_mean": 4321.8,
"valid_targets_min": 573
},
{
"epoch": 6.6617429837518465,
"grad_norm": 0.37245789606924895,
"learning_rate": 2.8633756368072307e-07,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11881101131439209,
"step": 4510,
"valid_targets_mean": 6310.8,
"valid_targets_min": 803
},
{
"epoch": 6.669128508124077,
"grad_norm": 0.4549884322992929,
"learning_rate": 2.740516262969051e-07,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1540367156267166,
"step": 4515,
"valid_targets_mean": 5073.8,
"valid_targets_min": 637
},
{
"epoch": 6.676514032496307,
"grad_norm": 0.4944141719547407,
"learning_rate": 2.6203325993930717e-07,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11980420351028442,
"step": 4520,
"valid_targets_mean": 4708.9,
"valid_targets_min": 499
},
{
"epoch": 6.683899556868537,
"grad_norm": 0.5049668775794947,
"learning_rate": 2.5028262763008514e-07,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17368857562541962,
"step": 4525,
"valid_targets_mean": 4323.2,
"valid_targets_min": 529
},
{
"epoch": 6.691285081240768,
"grad_norm": 0.39940995378060945,
"learning_rate": 2.3879988875973314e-07,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12155850231647491,
"step": 4530,
"valid_targets_mean": 6206.7,
"valid_targets_min": 552
},
{
"epoch": 6.698670605612999,
"grad_norm": 0.4013521013669753,
"learning_rate": 2.2758519908493648e-07,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15022462606430054,
"step": 4535,
"valid_targets_mean": 6336.5,
"valid_targets_min": 630
},
{
"epoch": 6.706056129985229,
"grad_norm": 0.5620177209255185,
"learning_rate": 2.1663871072643784e-07,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16755668818950653,
"step": 4540,
"valid_targets_mean": 3727.6,
"valid_targets_min": 390
},
{
"epoch": 6.713441654357459,
"grad_norm": 0.5258801995748262,
"learning_rate": 2.059605721669966e-07,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14239409565925598,
"step": 4545,
"valid_targets_mean": 4034.1,
"valid_targets_min": 540
},
{
"epoch": 6.72082717872969,
"grad_norm": 0.4560448915232561,
"learning_rate": 1.9555092824935062e-07,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1599361002445221,
"step": 4550,
"valid_targets_mean": 5137.9,
"valid_targets_min": 310
},
{
"epoch": 6.72821270310192,
"grad_norm": 0.46957544677234575,
"learning_rate": 1.854099201742754e-07,
"loss": 0.1469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13492749631404877,
"step": 4555,
"valid_targets_mean": 5321.8,
"valid_targets_min": 486
},
{
"epoch": 6.735598227474151,
"grad_norm": 0.4893832374792917,
"learning_rate": 1.7553768549864791e-07,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1458035260438919,
"step": 4560,
"valid_targets_mean": 4632.6,
"valid_targets_min": 723
},
{
"epoch": 6.742983751846381,
"grad_norm": 0.49924643293505594,
"learning_rate": 1.6593435813359704e-07,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1429969072341919,
"step": 4565,
"valid_targets_mean": 5114.1,
"valid_targets_min": 573
},
{
"epoch": 6.750369276218612,
"grad_norm": 0.5588546086896948,
"learning_rate": 1.5660006834267826e-07,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17076215147972107,
"step": 4570,
"valid_targets_mean": 3644.6,
"valid_targets_min": 462
},
{
"epoch": 6.757754800590842,
"grad_norm": 0.44934370220938186,
"learning_rate": 1.4753494274010404e-07,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12686952948570251,
"step": 4575,
"valid_targets_mean": 4405.2,
"valid_targets_min": 532
},
{
"epoch": 6.765140324963072,
"grad_norm": 0.40287819658097046,
"learning_rate": 1.387391042890407e-07,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1626736968755722,
"step": 4580,
"valid_targets_mean": 6230.9,
"valid_targets_min": 471
},
{
"epoch": 6.772525849335302,
"grad_norm": 0.39016310022420664,
"learning_rate": 1.3021267229992307e-07,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13419151306152344,
"step": 4585,
"valid_targets_mean": 5865.1,
"valid_targets_min": 552
},
{
"epoch": 6.779911373707534,
"grad_norm": 0.48929349503037056,
"learning_rate": 1.2195576242884256e-07,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16033774614334106,
"step": 4590,
"valid_targets_mean": 4465.0,
"valid_targets_min": 462
},
{
"epoch": 6.787296898079764,
"grad_norm": 0.4099040200611785,
"learning_rate": 1.1396848667598826e-07,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13809999823570251,
"step": 4595,
"valid_targets_mean": 5768.4,
"valid_targets_min": 562
},
{
"epoch": 6.794682422451994,
"grad_norm": 0.47774449623791543,
"learning_rate": 1.0625095338411051e-07,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1699640303850174,
"step": 4600,
"valid_targets_mean": 4953.6,
"valid_targets_min": 553
},
{
"epoch": 6.802067946824224,
"grad_norm": 0.5076200380883104,
"learning_rate": 9.880326723706646e-08,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1531982421875,
"step": 4605,
"valid_targets_mean": 4243.5,
"valid_targets_min": 575
},
{
"epoch": 6.809453471196455,
"grad_norm": 0.5365924598906461,
"learning_rate": 9.162552925838564e-08,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19307509064674377,
"step": 4610,
"valid_targets_mean": 4674.6,
"valid_targets_min": 577
},
{
"epoch": 6.816838995568685,
"grad_norm": 0.4114855170974802,
"learning_rate": 8.471783680991774e-08,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11866377294063568,
"step": 4615,
"valid_targets_mean": 5945.6,
"valid_targets_min": 500
},
{
"epoch": 6.824224519940916,
"grad_norm": 0.4311591899524311,
"learning_rate": 7.80802835904959e-08,
"loss": 0.137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13947513699531555,
"step": 4620,
"valid_targets_mean": 5683.1,
"valid_targets_min": 634
},
{
"epoch": 6.8316100443131464,
"grad_norm": 0.5619454499028758,
"learning_rate": 7.171295963466884e-08,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1453944444656372,
"step": 4625,
"valid_targets_mean": 4229.2,
"valid_targets_min": 517
},
{
"epoch": 6.838995568685377,
"grad_norm": 0.43973530083348866,
"learning_rate": 6.561595131149068e-08,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15559229254722595,
"step": 4630,
"valid_targets_mean": 5828.9,
"valid_targets_min": 731
},
{
"epoch": 6.846381093057607,
"grad_norm": 0.46646297249339624,
"learning_rate": 5.97893413233308e-08,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13109324872493744,
"step": 4635,
"valid_targets_mean": 4558.2,
"valid_targets_min": 721
},
{
"epoch": 6.853766617429837,
"grad_norm": 0.5158968571743305,
"learning_rate": 5.4233208704770336e-08,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18643151223659515,
"step": 4640,
"valid_targets_mean": 4622.7,
"valid_targets_min": 529
},
{
"epoch": 6.861152141802068,
"grad_norm": 0.42120731834961433,
"learning_rate": 4.894762882151849e-08,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12933212518692017,
"step": 4645,
"valid_targets_mean": 5539.8,
"valid_targets_min": 516
},
{
"epoch": 6.868537666174299,
"grad_norm": 0.4701920136133854,
"learning_rate": 4.393267336939566e-08,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16911543905735016,
"step": 4650,
"valid_targets_mean": 5174.4,
"valid_targets_min": 494
},
{
"epoch": 6.875923190546529,
"grad_norm": 0.4483722090071213,
"learning_rate": 3.9188410373358635e-08,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23113879561424255,
"step": 4655,
"valid_targets_mean": 6327.1,
"valid_targets_min": 597
},
{
"epoch": 6.883308714918759,
"grad_norm": 0.4700078471031414,
"learning_rate": 3.471490418657686e-08,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15961627662181854,
"step": 4660,
"valid_targets_mean": 5725.3,
"valid_targets_min": 648
},
{
"epoch": 6.89069423929099,
"grad_norm": 0.4655597595051389,
"learning_rate": 3.051221548956207e-08,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12833762168884277,
"step": 4665,
"valid_targets_mean": 4711.9,
"valid_targets_min": 725
},
{
"epoch": 6.89807976366322,
"grad_norm": 0.6380093111909683,
"learning_rate": 2.6580401289344472e-08,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1340949535369873,
"step": 4670,
"valid_targets_mean": 3719.6,
"valid_targets_min": 521
},
{
"epoch": 6.905465288035451,
"grad_norm": 0.42232440957412026,
"learning_rate": 2.2919514918700038e-08,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13673587143421173,
"step": 4675,
"valid_targets_mean": 6005.1,
"valid_targets_min": 567
},
{
"epoch": 6.912850812407681,
"grad_norm": 0.4656904084131196,
"learning_rate": 1.95296060354222e-08,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1485702097415924,
"step": 4680,
"valid_targets_mean": 5101.6,
"valid_targets_min": 579
},
{
"epoch": 6.920236336779912,
"grad_norm": 0.4808238353600059,
"learning_rate": 1.6410720621655718e-08,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1313798427581787,
"step": 4685,
"valid_targets_mean": 6804.3,
"valid_targets_min": 819
},
{
"epoch": 6.927621861152142,
"grad_norm": 0.4233348673449903,
"learning_rate": 1.356290098327051e-08,
"loss": 0.1553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15477396547794342,
"step": 4690,
"valid_targets_mean": 6435.8,
"valid_targets_min": 699
},
{
"epoch": 6.935007385524372,
"grad_norm": 0.43007196837079203,
"learning_rate": 1.0986185749282118e-08,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11044066399335861,
"step": 4695,
"valid_targets_mean": 5944.6,
"valid_targets_min": 229
},
{
"epoch": 6.942392909896602,
"grad_norm": 0.5232298527072103,
"learning_rate": 8.680609871338786e-09,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18600329756736755,
"step": 4700,
"valid_targets_mean": 4885.4,
"valid_targets_min": 799
},
{
"epoch": 6.949778434268833,
"grad_norm": 0.6339786906635847,
"learning_rate": 6.646204623232954e-09,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21870045363903046,
"step": 4705,
"valid_targets_mean": 3441.2,
"valid_targets_min": 526
},
{
"epoch": 6.957163958641064,
"grad_norm": 0.3930755994701203,
"learning_rate": 4.882997600494932e-09,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12523368000984192,
"step": 4710,
"valid_targets_mean": 6379.2,
"valid_targets_min": 563
},
{
"epoch": 6.964549483013294,
"grad_norm": 0.46455499149966306,
"learning_rate": 3.3910127199998643e-09,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1395748257637024,
"step": 4715,
"valid_targets_mean": 5036.2,
"valid_targets_min": 476
},
{
"epoch": 6.971935007385524,
"grad_norm": 0.5569847284562671,
"learning_rate": 2.170270219654658e-09,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16902390122413635,
"step": 4720,
"valid_targets_mean": 4324.9,
"valid_targets_min": 542
},
{
"epoch": 6.979320531757755,
"grad_norm": 0.4994292568305981,
"learning_rate": 1.2207866581248617e-09,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15097226202487946,
"step": 4725,
"valid_targets_mean": 4825.1,
"valid_targets_min": 314
},
{
"epoch": 6.986706056129985,
"grad_norm": 0.4317365485031485,
"learning_rate": 5.425749146015235e-10,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14707861840724945,
"step": 4730,
"valid_targets_mean": 6297.3,
"valid_targets_min": 696
},
{
"epoch": 6.994091580502216,
"grad_norm": 0.43567574617565746,
"learning_rate": 1.3564418863465378e-10,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13918901979923248,
"step": 4735,
"valid_targets_mean": 5156.8,
"valid_targets_min": 633
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13066400587558746,
"step": 4739,
"total_flos": 1781000233680896.0,
"train_loss": 0.19506101114987875,
"train_runtime": 33204.2929,
"train_samples_per_second": 2.281,
"train_steps_per_second": 0.143,
"valid_targets_mean": 5264.3,
"valid_targets_min": 320
}
],
"logging_steps": 5,
"max_steps": 4739,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1781000233680896.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}