Files
a1-stackexchange_superuser/trainer_state.json
ModelHub XC 7242c9cf82 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/a1-stackexchange_superuser
Source: Original Platform
2026-05-11 12:07:52 +08:00

9684 lines
268 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4382,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.007987220447284345,
"grad_norm": 15.17248931781073,
"learning_rate": 3.644646924829157e-07,
"loss": 0.9519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.873810887336731,
"step": 5,
"valid_targets_mean": 3127.7,
"valid_targets_min": 927
},
{
"epoch": 0.01597444089456869,
"grad_norm": 16.0447046422443,
"learning_rate": 8.200455580865605e-07,
"loss": 0.9762,
"loss_nan_ranks": 0,
"loss_rank_avg": 1.0120545625686646,
"step": 10,
"valid_targets_mean": 2819.0,
"valid_targets_min": 1221
},
{
"epoch": 0.023961661341853034,
"grad_norm": 15.982841317309331,
"learning_rate": 1.2756264236902052e-06,
"loss": 0.9655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.9404536485671997,
"step": 15,
"valid_targets_mean": 2939.2,
"valid_targets_min": 1003
},
{
"epoch": 0.03194888178913738,
"grad_norm": 16.68150841790565,
"learning_rate": 1.7312072892938498e-06,
"loss": 0.9297,
"loss_nan_ranks": 0,
"loss_rank_avg": 1.0098234415054321,
"step": 20,
"valid_targets_mean": 2228.9,
"valid_targets_min": 1122
},
{
"epoch": 0.039936102236421724,
"grad_norm": 7.699726336060192,
"learning_rate": 2.1867881548974945e-06,
"loss": 0.883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8025753498077393,
"step": 25,
"valid_targets_mean": 3127.9,
"valid_targets_min": 978
},
{
"epoch": 0.04792332268370607,
"grad_norm": 5.236211849772423,
"learning_rate": 2.642369020501139e-06,
"loss": 0.825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7962996959686279,
"step": 30,
"valid_targets_mean": 2854.4,
"valid_targets_min": 1089
},
{
"epoch": 0.05591054313099041,
"grad_norm": 3.7746117759364175,
"learning_rate": 3.0979498861047843e-06,
"loss": 0.7731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7613115310668945,
"step": 35,
"valid_targets_mean": 2395.0,
"valid_targets_min": 1120
},
{
"epoch": 0.06389776357827476,
"grad_norm": 2.169032644755572,
"learning_rate": 3.5535307517084285e-06,
"loss": 0.7068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7297231554985046,
"step": 40,
"valid_targets_mean": 2835.4,
"valid_targets_min": 1046
},
{
"epoch": 0.07188498402555911,
"grad_norm": 1.8529712575405926,
"learning_rate": 4.009111617312073e-06,
"loss": 0.7178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7068992853164673,
"step": 45,
"valid_targets_mean": 2749.2,
"valid_targets_min": 1262
},
{
"epoch": 0.07987220447284345,
"grad_norm": 1.74129413182321,
"learning_rate": 4.464692482915718e-06,
"loss": 0.7158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7441062927246094,
"step": 50,
"valid_targets_mean": 2308.6,
"valid_targets_min": 895
},
{
"epoch": 0.0878594249201278,
"grad_norm": 1.1261969765312332,
"learning_rate": 4.920273348519363e-06,
"loss": 0.6573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6407957673072815,
"step": 55,
"valid_targets_mean": 2901.4,
"valid_targets_min": 1280
},
{
"epoch": 0.09584664536741214,
"grad_norm": 1.189556858462003,
"learning_rate": 5.375854214123008e-06,
"loss": 0.682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6844934821128845,
"step": 60,
"valid_targets_mean": 2235.0,
"valid_targets_min": 1097
},
{
"epoch": 0.10383386581469649,
"grad_norm": 1.0707090957182381,
"learning_rate": 5.831435079726651e-06,
"loss": 0.6523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6878713965415955,
"step": 65,
"valid_targets_mean": 2627.6,
"valid_targets_min": 1230
},
{
"epoch": 0.11182108626198083,
"grad_norm": 1.0142874088661866,
"learning_rate": 6.287015945330297e-06,
"loss": 0.6362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6870459914207458,
"step": 70,
"valid_targets_mean": 2840.0,
"valid_targets_min": 1380
},
{
"epoch": 0.11980830670926518,
"grad_norm": 0.8175505785622187,
"learning_rate": 6.742596810933942e-06,
"loss": 0.643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6377227306365967,
"step": 75,
"valid_targets_mean": 3428.4,
"valid_targets_min": 1015
},
{
"epoch": 0.12779552715654952,
"grad_norm": 0.9047440311266008,
"learning_rate": 7.1981776765375854e-06,
"loss": 0.6375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5993684530258179,
"step": 80,
"valid_targets_mean": 2613.2,
"valid_targets_min": 855
},
{
"epoch": 0.13578274760383385,
"grad_norm": 0.8299903165340285,
"learning_rate": 7.65375854214123e-06,
"loss": 0.6111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5948533415794373,
"step": 85,
"valid_targets_mean": 2690.9,
"valid_targets_min": 1286
},
{
"epoch": 0.14376996805111822,
"grad_norm": 0.9198314766136052,
"learning_rate": 8.109339407744875e-06,
"loss": 0.6151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5966804027557373,
"step": 90,
"valid_targets_mean": 2349.4,
"valid_targets_min": 1028
},
{
"epoch": 0.15175718849840256,
"grad_norm": 0.7995206251913056,
"learning_rate": 8.564920273348521e-06,
"loss": 0.5595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47535890340805054,
"step": 95,
"valid_targets_mean": 2481.7,
"valid_targets_min": 1112
},
{
"epoch": 0.1597444089456869,
"grad_norm": 0.8508182370502543,
"learning_rate": 9.020501138952164e-06,
"loss": 0.5852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6482516527175903,
"step": 100,
"valid_targets_mean": 2932.8,
"valid_targets_min": 1364
},
{
"epoch": 0.16773162939297126,
"grad_norm": 0.8203564655537686,
"learning_rate": 9.47608200455581e-06,
"loss": 0.548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5478312969207764,
"step": 105,
"valid_targets_mean": 2946.6,
"valid_targets_min": 931
},
{
"epoch": 0.1757188498402556,
"grad_norm": 0.7569799752444644,
"learning_rate": 9.931662870159453e-06,
"loss": 0.5804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5435867309570312,
"step": 110,
"valid_targets_mean": 3103.2,
"valid_targets_min": 1609
},
{
"epoch": 0.18370607028753994,
"grad_norm": 0.8900695073471566,
"learning_rate": 1.03872437357631e-05,
"loss": 0.5534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5765122175216675,
"step": 115,
"valid_targets_mean": 3199.2,
"valid_targets_min": 701
},
{
"epoch": 0.19169329073482427,
"grad_norm": 0.8583125214810088,
"learning_rate": 1.0842824601366744e-05,
"loss": 0.5527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.537767767906189,
"step": 120,
"valid_targets_mean": 2467.8,
"valid_targets_min": 1100
},
{
"epoch": 0.19968051118210864,
"grad_norm": 0.7006043396902825,
"learning_rate": 1.1298405466970387e-05,
"loss": 0.5509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5513736605644226,
"step": 125,
"valid_targets_mean": 3579.0,
"valid_targets_min": 1342
},
{
"epoch": 0.20766773162939298,
"grad_norm": 0.766820394134251,
"learning_rate": 1.1753986332574032e-05,
"loss": 0.5702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5789293050765991,
"step": 130,
"valid_targets_mean": 2847.6,
"valid_targets_min": 1180
},
{
"epoch": 0.21565495207667731,
"grad_norm": 1.5002638242695263,
"learning_rate": 1.2209567198177677e-05,
"loss": 0.5899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6096343398094177,
"step": 135,
"valid_targets_mean": 2303.8,
"valid_targets_min": 866
},
{
"epoch": 0.22364217252396165,
"grad_norm": 0.7423434999018708,
"learning_rate": 1.2665148063781323e-05,
"loss": 0.5697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5750610828399658,
"step": 140,
"valid_targets_mean": 3315.2,
"valid_targets_min": 1237
},
{
"epoch": 0.23162939297124602,
"grad_norm": 0.8496784328818882,
"learning_rate": 1.3120728929384968e-05,
"loss": 0.5676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5569379329681396,
"step": 145,
"valid_targets_mean": 2489.4,
"valid_targets_min": 1083
},
{
"epoch": 0.23961661341853036,
"grad_norm": 0.7627769903145462,
"learning_rate": 1.357630979498861e-05,
"loss": 0.5495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5773597955703735,
"step": 150,
"valid_targets_mean": 3161.5,
"valid_targets_min": 1192
},
{
"epoch": 0.2476038338658147,
"grad_norm": 0.8821586946530701,
"learning_rate": 1.4031890660592255e-05,
"loss": 0.5394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5083107948303223,
"step": 155,
"valid_targets_mean": 2946.1,
"valid_targets_min": 787
},
{
"epoch": 0.25559105431309903,
"grad_norm": 0.909958221284572,
"learning_rate": 1.4487471526195902e-05,
"loss": 0.5419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5862777233123779,
"step": 160,
"valid_targets_mean": 2436.4,
"valid_targets_min": 1083
},
{
"epoch": 0.26357827476038337,
"grad_norm": 0.854377313552898,
"learning_rate": 1.4943052391799546e-05,
"loss": 0.5346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5437299609184265,
"step": 165,
"valid_targets_mean": 2534.8,
"valid_targets_min": 810
},
{
"epoch": 0.2715654952076677,
"grad_norm": 0.9103282941916306,
"learning_rate": 1.539863325740319e-05,
"loss": 0.5074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4946935474872589,
"step": 170,
"valid_targets_mean": 2139.8,
"valid_targets_min": 1156
},
{
"epoch": 0.2795527156549521,
"grad_norm": 0.88133799748646,
"learning_rate": 1.5854214123006836e-05,
"loss": 0.5215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5952520370483398,
"step": 175,
"valid_targets_mean": 2498.9,
"valid_targets_min": 957
},
{
"epoch": 0.28753993610223644,
"grad_norm": 0.6850615122575533,
"learning_rate": 1.630979498861048e-05,
"loss": 0.5123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4720776677131653,
"step": 180,
"valid_targets_mean": 3554.1,
"valid_targets_min": 1052
},
{
"epoch": 0.2955271565495208,
"grad_norm": 0.8550204357494533,
"learning_rate": 1.6765375854214125e-05,
"loss": 0.5473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5485037565231323,
"step": 185,
"valid_targets_mean": 2786.8,
"valid_targets_min": 948
},
{
"epoch": 0.3035143769968051,
"grad_norm": 0.8206472164048848,
"learning_rate": 1.722095671981777e-05,
"loss": 0.5584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5042972564697266,
"step": 190,
"valid_targets_mean": 2728.0,
"valid_targets_min": 712
},
{
"epoch": 0.31150159744408945,
"grad_norm": 0.6728094856065869,
"learning_rate": 1.7676537585421415e-05,
"loss": 0.5269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5326317548751831,
"step": 195,
"valid_targets_mean": 3720.7,
"valid_targets_min": 1523
},
{
"epoch": 0.3194888178913738,
"grad_norm": 0.7728618092725199,
"learning_rate": 1.813211845102506e-05,
"loss": 0.5197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4793850779533386,
"step": 200,
"valid_targets_mean": 2741.7,
"valid_targets_min": 861
},
{
"epoch": 0.3274760383386581,
"grad_norm": 0.7801842035185508,
"learning_rate": 1.8587699316628704e-05,
"loss": 0.518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5253409147262573,
"step": 205,
"valid_targets_mean": 2814.8,
"valid_targets_min": 861
},
{
"epoch": 0.3354632587859425,
"grad_norm": 0.9863154154066794,
"learning_rate": 1.904328018223235e-05,
"loss": 0.5542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6215020418167114,
"step": 210,
"valid_targets_mean": 2646.8,
"valid_targets_min": 955
},
{
"epoch": 0.34345047923322686,
"grad_norm": 0.7331588617100306,
"learning_rate": 1.9498861047835993e-05,
"loss": 0.5255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4908156096935272,
"step": 215,
"valid_targets_mean": 3356.9,
"valid_targets_min": 1352
},
{
"epoch": 0.3514376996805112,
"grad_norm": 0.8791842141556658,
"learning_rate": 1.9954441913439638e-05,
"loss": 0.5239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5295369625091553,
"step": 220,
"valid_targets_mean": 2351.9,
"valid_targets_min": 1185
},
{
"epoch": 0.35942492012779553,
"grad_norm": 0.7787307287825401,
"learning_rate": 2.0410022779043283e-05,
"loss": 0.4988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48588457703590393,
"step": 225,
"valid_targets_mean": 2535.1,
"valid_targets_min": 1259
},
{
"epoch": 0.36741214057507987,
"grad_norm": 0.8556036439676711,
"learning_rate": 2.0865603644646927e-05,
"loss": 0.5863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6629254817962646,
"step": 230,
"valid_targets_mean": 2723.0,
"valid_targets_min": 1005
},
{
"epoch": 0.3753993610223642,
"grad_norm": 0.8057536275212785,
"learning_rate": 2.1321184510250572e-05,
"loss": 0.5399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6240401864051819,
"step": 235,
"valid_targets_mean": 2943.8,
"valid_targets_min": 1330
},
{
"epoch": 0.38338658146964855,
"grad_norm": 0.9850495934806481,
"learning_rate": 2.1776765375854217e-05,
"loss": 0.5133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49222493171691895,
"step": 240,
"valid_targets_mean": 1964.6,
"valid_targets_min": 946
},
{
"epoch": 0.3913738019169329,
"grad_norm": 0.8186455781999009,
"learning_rate": 2.223234624145786e-05,
"loss": 0.5153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5153531432151794,
"step": 245,
"valid_targets_mean": 2717.8,
"valid_targets_min": 1133
},
{
"epoch": 0.3993610223642173,
"grad_norm": 1.9660992396620858,
"learning_rate": 2.2687927107061506e-05,
"loss": 0.5278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5080440044403076,
"step": 250,
"valid_targets_mean": 3080.2,
"valid_targets_min": 1306
},
{
"epoch": 0.4073482428115016,
"grad_norm": 0.6777855096046905,
"learning_rate": 2.314350797266515e-05,
"loss": 0.5092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45302075147628784,
"step": 255,
"valid_targets_mean": 3767.1,
"valid_targets_min": 1306
},
{
"epoch": 0.41533546325878595,
"grad_norm": 0.8427065918822899,
"learning_rate": 2.3599088838268792e-05,
"loss": 0.4911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5029305219650269,
"step": 260,
"valid_targets_mean": 2818.7,
"valid_targets_min": 1464
},
{
"epoch": 0.4233226837060703,
"grad_norm": 0.7968222858710973,
"learning_rate": 2.4054669703872436e-05,
"loss": 0.5159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5117211937904358,
"step": 265,
"valid_targets_mean": 2781.1,
"valid_targets_min": 1213
},
{
"epoch": 0.43130990415335463,
"grad_norm": 0.8271573611997252,
"learning_rate": 2.4510250569476085e-05,
"loss": 0.5422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4576948583126068,
"step": 270,
"valid_targets_mean": 2558.8,
"valid_targets_min": 1229
},
{
"epoch": 0.43929712460063897,
"grad_norm": 0.7901461972408579,
"learning_rate": 2.496583143507973e-05,
"loss": 0.4954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49033161997795105,
"step": 275,
"valid_targets_mean": 3283.5,
"valid_targets_min": 871
},
{
"epoch": 0.4472843450479233,
"grad_norm": 0.8814296735699261,
"learning_rate": 2.5421412300683374e-05,
"loss": 0.4931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5419114828109741,
"step": 280,
"valid_targets_mean": 2600.2,
"valid_targets_min": 497
},
{
"epoch": 0.45527156549520764,
"grad_norm": 0.8843077229773383,
"learning_rate": 2.587699316628702e-05,
"loss": 0.4964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5407685041427612,
"step": 285,
"valid_targets_mean": 2370.4,
"valid_targets_min": 901
},
{
"epoch": 0.46325878594249204,
"grad_norm": 1.0771357872311227,
"learning_rate": 2.6332574031890663e-05,
"loss": 0.5295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6103911995887756,
"step": 290,
"valid_targets_mean": 2440.1,
"valid_targets_min": 1380
},
{
"epoch": 0.4712460063897764,
"grad_norm": 0.7179319622664404,
"learning_rate": 2.6788154897494308e-05,
"loss": 0.4741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4417612552642822,
"step": 295,
"valid_targets_mean": 3418.1,
"valid_targets_min": 1392
},
{
"epoch": 0.4792332268370607,
"grad_norm": 0.714979713777273,
"learning_rate": 2.7243735763097953e-05,
"loss": 0.5061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44420793652534485,
"step": 300,
"valid_targets_mean": 3550.5,
"valid_targets_min": 1539
},
{
"epoch": 0.48722044728434505,
"grad_norm": 0.832676511155696,
"learning_rate": 2.7699316628701597e-05,
"loss": 0.49,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5182697772979736,
"step": 305,
"valid_targets_mean": 2901.4,
"valid_targets_min": 1270
},
{
"epoch": 0.4952076677316294,
"grad_norm": 1.2011451937543158,
"learning_rate": 2.815489749430524e-05,
"loss": 0.5109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5339452624320984,
"step": 310,
"valid_targets_mean": 3127.3,
"valid_targets_min": 1080
},
{
"epoch": 0.5031948881789138,
"grad_norm": 1.1011304858781235,
"learning_rate": 2.8610478359908883e-05,
"loss": 0.489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4957484304904938,
"step": 315,
"valid_targets_mean": 2123.2,
"valid_targets_min": 960
},
{
"epoch": 0.5111821086261981,
"grad_norm": 0.7518434901268846,
"learning_rate": 2.906605922551253e-05,
"loss": 0.4972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5477015972137451,
"step": 320,
"valid_targets_mean": 3466.9,
"valid_targets_min": 1186
},
{
"epoch": 0.5191693290734825,
"grad_norm": 0.818548220458573,
"learning_rate": 2.9521640091116176e-05,
"loss": 0.5047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4946255087852478,
"step": 325,
"valid_targets_mean": 2968.8,
"valid_targets_min": 873
},
{
"epoch": 0.5271565495207667,
"grad_norm": 0.9354909961997221,
"learning_rate": 2.997722095671982e-05,
"loss": 0.4983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5147006511688232,
"step": 330,
"valid_targets_mean": 2093.4,
"valid_targets_min": 811
},
{
"epoch": 0.5351437699680511,
"grad_norm": 0.8861773466418632,
"learning_rate": 3.0432801822323465e-05,
"loss": 0.5012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5008596777915955,
"step": 335,
"valid_targets_mean": 3097.7,
"valid_targets_min": 921
},
{
"epoch": 0.5431309904153354,
"grad_norm": 0.7688169713732055,
"learning_rate": 3.088838268792711e-05,
"loss": 0.5055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.496390700340271,
"step": 340,
"valid_targets_mean": 3200.6,
"valid_targets_min": 1282
},
{
"epoch": 0.5511182108626198,
"grad_norm": 0.8113792447780495,
"learning_rate": 3.1343963553530755e-05,
"loss": 0.5209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5141535997390747,
"step": 345,
"valid_targets_mean": 2751.6,
"valid_targets_min": 1031
},
{
"epoch": 0.5591054313099042,
"grad_norm": 2.1321863058940393,
"learning_rate": 3.17995444191344e-05,
"loss": 0.4779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5301027297973633,
"step": 350,
"valid_targets_mean": 2933.4,
"valid_targets_min": 1160
},
{
"epoch": 0.5670926517571885,
"grad_norm": 0.6806494335642181,
"learning_rate": 3.2255125284738044e-05,
"loss": 0.4775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.506610095500946,
"step": 355,
"valid_targets_mean": 3795.7,
"valid_targets_min": 1294
},
{
"epoch": 0.5750798722044729,
"grad_norm": 0.8467603882079074,
"learning_rate": 3.271070615034169e-05,
"loss": 0.4982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4562826156616211,
"step": 360,
"valid_targets_mean": 2606.6,
"valid_targets_min": 981
},
{
"epoch": 0.5830670926517572,
"grad_norm": 0.8022847528326496,
"learning_rate": 3.316628701594533e-05,
"loss": 0.5121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.531557559967041,
"step": 365,
"valid_targets_mean": 2998.2,
"valid_targets_min": 1473
},
{
"epoch": 0.5910543130990416,
"grad_norm": 0.8556604547740909,
"learning_rate": 3.362186788154898e-05,
"loss": 0.4987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5079728364944458,
"step": 370,
"valid_targets_mean": 2428.6,
"valid_targets_min": 892
},
{
"epoch": 0.5990415335463258,
"grad_norm": 0.7394590411511266,
"learning_rate": 3.407744874715262e-05,
"loss": 0.4861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4963635206222534,
"step": 375,
"valid_targets_mean": 3267.9,
"valid_targets_min": 1407
},
{
"epoch": 0.6070287539936102,
"grad_norm": 0.6521727148571741,
"learning_rate": 3.453302961275627e-05,
"loss": 0.5189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48329901695251465,
"step": 380,
"valid_targets_mean": 3911.4,
"valid_targets_min": 849
},
{
"epoch": 0.6150159744408946,
"grad_norm": 0.8229679295931809,
"learning_rate": 3.498861047835991e-05,
"loss": 0.4934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4811190366744995,
"step": 385,
"valid_targets_mean": 2285.9,
"valid_targets_min": 826
},
{
"epoch": 0.6230031948881789,
"grad_norm": 0.9071810840956518,
"learning_rate": 3.5444191343963557e-05,
"loss": 0.4721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4603239893913269,
"step": 390,
"valid_targets_mean": 2446.5,
"valid_targets_min": 1318
},
{
"epoch": 0.6309904153354633,
"grad_norm": 0.8673398873329051,
"learning_rate": 3.58997722095672e-05,
"loss": 0.4829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5173234939575195,
"step": 395,
"valid_targets_mean": 2453.8,
"valid_targets_min": 969
},
{
"epoch": 0.6389776357827476,
"grad_norm": 0.7684733433083464,
"learning_rate": 3.6355353075170846e-05,
"loss": 0.5033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5281765460968018,
"step": 400,
"valid_targets_mean": 2919.4,
"valid_targets_min": 920
},
{
"epoch": 0.646964856230032,
"grad_norm": 0.8185705410175095,
"learning_rate": 3.681093394077449e-05,
"loss": 0.4779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4623745083808899,
"step": 405,
"valid_targets_mean": 2701.0,
"valid_targets_min": 1169
},
{
"epoch": 0.6549520766773163,
"grad_norm": 0.7773039011766039,
"learning_rate": 3.7266514806378135e-05,
"loss": 0.46,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.486310213804245,
"step": 410,
"valid_targets_mean": 2514.9,
"valid_targets_min": 970
},
{
"epoch": 0.6629392971246006,
"grad_norm": 0.737226072296739,
"learning_rate": 3.772209567198178e-05,
"loss": 0.4686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4548845589160919,
"step": 415,
"valid_targets_mean": 3062.8,
"valid_targets_min": 1112
},
{
"epoch": 0.670926517571885,
"grad_norm": 0.8207102057499368,
"learning_rate": 3.8177676537585425e-05,
"loss": 0.5013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5302478075027466,
"step": 420,
"valid_targets_mean": 2693.4,
"valid_targets_min": 913
},
{
"epoch": 0.6789137380191693,
"grad_norm": 0.8145687731562341,
"learning_rate": 3.863325740318907e-05,
"loss": 0.5151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5070667266845703,
"step": 425,
"valid_targets_mean": 2775.8,
"valid_targets_min": 1168
},
{
"epoch": 0.6869009584664537,
"grad_norm": 0.8111716683915323,
"learning_rate": 3.9088838268792714e-05,
"loss": 0.4944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4909268915653229,
"step": 430,
"valid_targets_mean": 2921.1,
"valid_targets_min": 1126
},
{
"epoch": 0.694888178913738,
"grad_norm": 0.7411546696567747,
"learning_rate": 3.954441913439636e-05,
"loss": 0.4783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4458876848220825,
"step": 435,
"valid_targets_mean": 3290.1,
"valid_targets_min": 1084
},
{
"epoch": 0.7028753993610224,
"grad_norm": 0.7518470194155535,
"learning_rate": 4e-05,
"loss": 0.4812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4502463638782501,
"step": 440,
"valid_targets_mean": 2823.3,
"valid_targets_min": 1108
},
{
"epoch": 0.7108626198083067,
"grad_norm": 0.7640155259479486,
"learning_rate": 3.999984129682125e-05,
"loss": 0.4932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46215182542800903,
"step": 445,
"valid_targets_mean": 2613.8,
"valid_targets_min": 960
},
{
"epoch": 0.7188498402555911,
"grad_norm": 0.7415555019488704,
"learning_rate": 3.9999365189803684e-05,
"loss": 0.4708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4664982557296753,
"step": 450,
"valid_targets_mean": 3100.8,
"valid_targets_min": 1095
},
{
"epoch": 0.7268370607028753,
"grad_norm": 0.802377503314035,
"learning_rate": 3.9998571686503264e-05,
"loss": 0.4866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4585043489933014,
"step": 455,
"valid_targets_mean": 2264.9,
"valid_targets_min": 909
},
{
"epoch": 0.7348242811501597,
"grad_norm": 0.708085049519949,
"learning_rate": 3.9997460799513134e-05,
"loss": 0.4845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5432193279266357,
"step": 460,
"valid_targets_mean": 3839.4,
"valid_targets_min": 873
},
{
"epoch": 0.7428115015974441,
"grad_norm": 0.7879120589505894,
"learning_rate": 3.999603254646343e-05,
"loss": 0.475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46323227882385254,
"step": 465,
"valid_targets_mean": 3269.4,
"valid_targets_min": 1072
},
{
"epoch": 0.7507987220447284,
"grad_norm": 0.749075306348792,
"learning_rate": 3.9994286950020986e-05,
"loss": 0.507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4851936101913452,
"step": 470,
"valid_targets_mean": 3137.9,
"valid_targets_min": 1124
},
{
"epoch": 0.7587859424920128,
"grad_norm": 0.7129540444830214,
"learning_rate": 3.999222403788896e-05,
"loss": 0.4729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4908882975578308,
"step": 475,
"valid_targets_mean": 3526.2,
"valid_targets_min": 1146
},
{
"epoch": 0.7667731629392971,
"grad_norm": 0.73095835831582,
"learning_rate": 3.9989843842806435e-05,
"loss": 0.4863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43629252910614014,
"step": 480,
"valid_targets_mean": 3166.7,
"valid_targets_min": 1356
},
{
"epoch": 0.7747603833865815,
"grad_norm": 0.8481950002243562,
"learning_rate": 3.998714640254786e-05,
"loss": 0.4703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4779198169708252,
"step": 485,
"valid_targets_mean": 2446.2,
"valid_targets_min": 1053
},
{
"epoch": 0.7827476038338658,
"grad_norm": 0.9252979170092325,
"learning_rate": 3.998413175992247e-05,
"loss": 0.4909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4803544878959656,
"step": 490,
"valid_targets_mean": 2121.9,
"valid_targets_min": 1006
},
{
"epoch": 0.7907348242811502,
"grad_norm": 0.9413520178628827,
"learning_rate": 3.99807999627736e-05,
"loss": 0.5062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5145155191421509,
"step": 495,
"valid_targets_mean": 2570.1,
"valid_targets_min": 1079
},
{
"epoch": 0.7987220447284346,
"grad_norm": 0.8048047081738046,
"learning_rate": 3.997715106397794e-05,
"loss": 0.4847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4717975854873657,
"step": 500,
"valid_targets_mean": 2329.3,
"valid_targets_min": 938
},
{
"epoch": 0.8067092651757188,
"grad_norm": 0.7643728322556019,
"learning_rate": 3.997318512144465e-05,
"loss": 0.4873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46637722849845886,
"step": 505,
"valid_targets_mean": 2817.7,
"valid_targets_min": 715
},
{
"epoch": 0.8146964856230032,
"grad_norm": 0.8279624349532135,
"learning_rate": 3.9968902198114516e-05,
"loss": 0.4673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5180720686912537,
"step": 510,
"valid_targets_mean": 2913.6,
"valid_targets_min": 823
},
{
"epoch": 0.8226837060702875,
"grad_norm": 0.8109766155806294,
"learning_rate": 3.996430236195889e-05,
"loss": 0.4805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49160677194595337,
"step": 515,
"valid_targets_mean": 2462.8,
"valid_targets_min": 1046
},
{
"epoch": 0.8306709265175719,
"grad_norm": 0.7956373398673393,
"learning_rate": 3.995938568597864e-05,
"loss": 0.4909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42897269129753113,
"step": 520,
"valid_targets_mean": 2364.6,
"valid_targets_min": 1400
},
{
"epoch": 0.8386581469648562,
"grad_norm": 0.7414841411842699,
"learning_rate": 3.995415224820297e-05,
"loss": 0.4887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5362697839736938,
"step": 525,
"valid_targets_mean": 3108.9,
"valid_targets_min": 1195
},
{
"epoch": 0.8466453674121406,
"grad_norm": 0.8317859182220397,
"learning_rate": 3.994860213168819e-05,
"loss": 0.469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.483562171459198,
"step": 530,
"valid_targets_mean": 2305.6,
"valid_targets_min": 1103
},
{
"epoch": 0.854632587859425,
"grad_norm": 0.8462535217865819,
"learning_rate": 3.9942735424516435e-05,
"loss": 0.4811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4656353294849396,
"step": 535,
"valid_targets_mean": 2399.4,
"valid_targets_min": 613
},
{
"epoch": 0.8626198083067093,
"grad_norm": 0.7834889362197252,
"learning_rate": 3.9936552219794196e-05,
"loss": 0.4826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4877358675003052,
"step": 540,
"valid_targets_mean": 3244.2,
"valid_targets_min": 837
},
{
"epoch": 0.8706070287539937,
"grad_norm": 0.8102216918022214,
"learning_rate": 3.993005261565091e-05,
"loss": 0.4716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4835214614868164,
"step": 545,
"valid_targets_mean": 2657.9,
"valid_targets_min": 895
},
{
"epoch": 0.8785942492012779,
"grad_norm": 0.7484190976431879,
"learning_rate": 3.992323671523735e-05,
"loss": 0.4861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4827854037284851,
"step": 550,
"valid_targets_mean": 2936.5,
"valid_targets_min": 769
},
{
"epoch": 0.8865814696485623,
"grad_norm": 0.8298777988018279,
"learning_rate": 3.991610462672403e-05,
"loss": 0.4842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.509543240070343,
"step": 555,
"valid_targets_mean": 2912.0,
"valid_targets_min": 1159
},
{
"epoch": 0.8945686900958466,
"grad_norm": 0.7034233322649788,
"learning_rate": 3.9908656463299456e-05,
"loss": 0.4695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4778456389904022,
"step": 560,
"valid_targets_mean": 3026.8,
"valid_targets_min": 1167
},
{
"epoch": 0.902555910543131,
"grad_norm": 0.7349295369253303,
"learning_rate": 3.990089234316835e-05,
"loss": 0.4771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42017149925231934,
"step": 565,
"valid_targets_mean": 2561.4,
"valid_targets_min": 1007
},
{
"epoch": 0.9105431309904153,
"grad_norm": 0.8513539946715051,
"learning_rate": 3.989281238954978e-05,
"loss": 0.4812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45802587270736694,
"step": 570,
"valid_targets_mean": 2120.5,
"valid_targets_min": 962
},
{
"epoch": 0.9185303514376997,
"grad_norm": 0.7971530719267699,
"learning_rate": 3.9884416730675155e-05,
"loss": 0.4671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48669928312301636,
"step": 575,
"valid_targets_mean": 3067.6,
"valid_targets_min": 1125
},
{
"epoch": 0.9265175718849841,
"grad_norm": 0.7526750754328368,
"learning_rate": 3.987570549978626e-05,
"loss": 0.4601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4806230962276459,
"step": 580,
"valid_targets_mean": 2587.2,
"valid_targets_min": 1150
},
{
"epoch": 0.9345047923322684,
"grad_norm": 0.8137737946062722,
"learning_rate": 3.986667883513311e-05,
"loss": 0.4563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.518112301826477,
"step": 585,
"valid_targets_mean": 2852.7,
"valid_targets_min": 1193
},
{
"epoch": 0.9424920127795527,
"grad_norm": 0.8659103970463817,
"learning_rate": 3.985733687997173e-05,
"loss": 0.489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5319004058837891,
"step": 590,
"valid_targets_mean": 2343.2,
"valid_targets_min": 1225
},
{
"epoch": 0.950479233226837,
"grad_norm": 0.7469614351703592,
"learning_rate": 3.984767978256192e-05,
"loss": 0.4564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4597756266593933,
"step": 595,
"valid_targets_mean": 2952.0,
"valid_targets_min": 1383
},
{
"epoch": 0.9584664536741214,
"grad_norm": 0.7861886747969548,
"learning_rate": 3.983770769616488e-05,
"loss": 0.4622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4694702923297882,
"step": 600,
"valid_targets_mean": 2704.9,
"valid_targets_min": 855
},
{
"epoch": 0.9664536741214057,
"grad_norm": 0.7149924456313416,
"learning_rate": 3.9827420779040805e-05,
"loss": 0.4772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4691518545150757,
"step": 605,
"valid_targets_mean": 3017.1,
"valid_targets_min": 1070
},
{
"epoch": 0.9744408945686901,
"grad_norm": 0.6590357190461086,
"learning_rate": 3.981681919444633e-05,
"loss": 0.4613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.416545569896698,
"step": 610,
"valid_targets_mean": 3355.1,
"valid_targets_min": 865
},
{
"epoch": 0.9824281150159745,
"grad_norm": 0.7704139751683394,
"learning_rate": 3.980590311063197e-05,
"loss": 0.479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5077451467514038,
"step": 615,
"valid_targets_mean": 2788.4,
"valid_targets_min": 651
},
{
"epoch": 0.9904153354632588,
"grad_norm": 0.738816152478186,
"learning_rate": 3.9794672700839455e-05,
"loss": 0.4779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47935396432876587,
"step": 620,
"valid_targets_mean": 2682.5,
"valid_targets_min": 1006
},
{
"epoch": 0.9984025559105432,
"grad_norm": 0.7573465905776805,
"learning_rate": 3.9783128143298945e-05,
"loss": 0.4591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5034106969833374,
"step": 625,
"valid_targets_mean": 2697.0,
"valid_targets_min": 878
},
{
"epoch": 1.0063897763578276,
"grad_norm": 0.7685082899437944,
"learning_rate": 3.977126962122625e-05,
"loss": 0.4473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4544332027435303,
"step": 630,
"valid_targets_mean": 2484.2,
"valid_targets_min": 1257
},
{
"epoch": 1.0143769968051117,
"grad_norm": 0.7630287431391214,
"learning_rate": 3.975909732281988e-05,
"loss": 0.4815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5001740455627441,
"step": 635,
"valid_targets_mean": 2804.8,
"valid_targets_min": 1111
},
{
"epoch": 1.0223642172523961,
"grad_norm": 0.8349889620121833,
"learning_rate": 3.974661144125808e-05,
"loss": 0.4379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44968223571777344,
"step": 640,
"valid_targets_mean": 2246.1,
"valid_targets_min": 934
},
{
"epoch": 1.0303514376996805,
"grad_norm": 0.7289354674087208,
"learning_rate": 3.973381217469576e-05,
"loss": 0.4177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39167508482933044,
"step": 645,
"valid_targets_mean": 2778.6,
"valid_targets_min": 1312
},
{
"epoch": 1.038338658146965,
"grad_norm": 0.7610454326773037,
"learning_rate": 3.972069972626135e-05,
"loss": 0.4489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4945276379585266,
"step": 650,
"valid_targets_mean": 2881.5,
"valid_targets_min": 1154
},
{
"epoch": 1.0463258785942493,
"grad_norm": 0.7529804157949619,
"learning_rate": 3.970727430405357e-05,
"loss": 0.4461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4402261972427368,
"step": 655,
"valid_targets_mean": 3169.2,
"valid_targets_min": 881
},
{
"epoch": 1.0543130990415335,
"grad_norm": 0.7479368522385385,
"learning_rate": 3.969353612113815e-05,
"loss": 0.4171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45113587379455566,
"step": 660,
"valid_targets_mean": 2818.9,
"valid_targets_min": 904
},
{
"epoch": 1.0623003194888179,
"grad_norm": 0.7429987740189701,
"learning_rate": 3.96794853955444e-05,
"loss": 0.4416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3951209783554077,
"step": 665,
"valid_targets_mean": 2721.9,
"valid_targets_min": 855
},
{
"epoch": 1.0702875399361023,
"grad_norm": 0.6988528547787896,
"learning_rate": 3.966512235026182e-05,
"loss": 0.4364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44669538736343384,
"step": 670,
"valid_targets_mean": 3886.9,
"valid_targets_min": 970
},
{
"epoch": 1.0782747603833867,
"grad_norm": 0.7685049413282936,
"learning_rate": 3.96504472132365e-05,
"loss": 0.4628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46493786573410034,
"step": 675,
"valid_targets_mean": 2864.7,
"valid_targets_min": 912
},
{
"epoch": 1.0862619808306708,
"grad_norm": 0.7321617108406029,
"learning_rate": 3.9635460217367513e-05,
"loss": 0.4508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41404807567596436,
"step": 680,
"valid_targets_mean": 2885.9,
"valid_targets_min": 1079
},
{
"epoch": 1.0942492012779552,
"grad_norm": 0.7592802978135224,
"learning_rate": 3.962016160050327e-05,
"loss": 0.4482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41572150588035583,
"step": 685,
"valid_targets_mean": 2479.6,
"valid_targets_min": 913
},
{
"epoch": 1.1022364217252396,
"grad_norm": 0.732817568596785,
"learning_rate": 3.960455160543767e-05,
"loss": 0.4626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42624184489250183,
"step": 690,
"valid_targets_mean": 2974.9,
"valid_targets_min": 928
},
{
"epoch": 1.110223642172524,
"grad_norm": 0.76011633776547,
"learning_rate": 3.958863047990631e-05,
"loss": 0.4283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43110883235931396,
"step": 695,
"valid_targets_mean": 2901.8,
"valid_targets_min": 938
},
{
"epoch": 1.1182108626198084,
"grad_norm": 0.8431475807189021,
"learning_rate": 3.95723984765825e-05,
"loss": 0.4612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5132505893707275,
"step": 700,
"valid_targets_mean": 2484.8,
"valid_targets_min": 1412
},
{
"epoch": 1.1261980830670926,
"grad_norm": 0.9220223660266152,
"learning_rate": 3.955585585307329e-05,
"loss": 0.46,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44615116715431213,
"step": 705,
"valid_targets_mean": 2291.6,
"valid_targets_min": 884
},
{
"epoch": 1.134185303514377,
"grad_norm": 1.019334003630654,
"learning_rate": 3.9539002871915395e-05,
"loss": 0.4542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43944239616394043,
"step": 710,
"valid_targets_mean": 2567.4,
"valid_targets_min": 1308
},
{
"epoch": 1.1421725239616614,
"grad_norm": 0.7795615708622041,
"learning_rate": 3.952183980057096e-05,
"loss": 0.4325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4104035496711731,
"step": 715,
"valid_targets_mean": 2444.2,
"valid_targets_min": 803
},
{
"epoch": 1.1501597444089458,
"grad_norm": 0.8468623107296779,
"learning_rate": 3.950436691142339e-05,
"loss": 0.4401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43115919828414917,
"step": 720,
"valid_targets_mean": 2466.9,
"valid_targets_min": 1406
},
{
"epoch": 1.15814696485623,
"grad_norm": 0.8529964274281423,
"learning_rate": 3.948658448177299e-05,
"loss": 0.4524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48739194869995117,
"step": 725,
"valid_targets_mean": 2443.1,
"valid_targets_min": 1168
},
{
"epoch": 1.1661341853035143,
"grad_norm": 0.7172046757160037,
"learning_rate": 3.946849279383258e-05,
"loss": 0.4257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3758084774017334,
"step": 730,
"valid_targets_mean": 2842.2,
"valid_targets_min": 1077
},
{
"epoch": 1.1741214057507987,
"grad_norm": 0.711565411890527,
"learning_rate": 3.9450092134722984e-05,
"loss": 0.4377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4145118296146393,
"step": 735,
"valid_targets_mean": 3007.6,
"valid_targets_min": 507
},
{
"epoch": 1.182108626198083,
"grad_norm": 0.8309877125516639,
"learning_rate": 3.943138279646853e-05,
"loss": 0.4421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46872472763061523,
"step": 740,
"valid_targets_mean": 2660.7,
"valid_targets_min": 818
},
{
"epoch": 1.1900958466453675,
"grad_norm": 0.8195558428978243,
"learning_rate": 3.941236507599234e-05,
"loss": 0.4364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4253050982952118,
"step": 745,
"valid_targets_mean": 2162.1,
"valid_targets_min": 877
},
{
"epoch": 1.1980830670926517,
"grad_norm": 0.7757463661583209,
"learning_rate": 3.93930392751117e-05,
"loss": 0.4283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41354313492774963,
"step": 750,
"valid_targets_mean": 2641.2,
"valid_targets_min": 1158
},
{
"epoch": 1.206070287539936,
"grad_norm": 0.8685777071160953,
"learning_rate": 3.9373405700533204e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4196351170539856,
"step": 755,
"valid_targets_mean": 2522.3,
"valid_targets_min": 733
},
{
"epoch": 1.2140575079872205,
"grad_norm": 0.7508846483862592,
"learning_rate": 3.935346466384793e-05,
"loss": 0.4199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44403281807899475,
"step": 760,
"valid_targets_mean": 3216.3,
"valid_targets_min": 1101
},
{
"epoch": 1.2220447284345048,
"grad_norm": 0.758240824860655,
"learning_rate": 3.933321648152646e-05,
"loss": 0.4384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4567496180534363,
"step": 765,
"valid_targets_mean": 2950.4,
"valid_targets_min": 1193
},
{
"epoch": 1.230031948881789,
"grad_norm": 0.7200839121536595,
"learning_rate": 3.931266147491389e-05,
"loss": 0.4516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4802227020263672,
"step": 770,
"valid_targets_mean": 3282.1,
"valid_targets_min": 1203
},
{
"epoch": 1.2380191693290734,
"grad_norm": 0.6572973431050214,
"learning_rate": 3.929179997022471e-05,
"loss": 0.4278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39114686846733093,
"step": 775,
"valid_targets_mean": 3843.3,
"valid_targets_min": 992
},
{
"epoch": 1.2460063897763578,
"grad_norm": 0.6844582042432027,
"learning_rate": 3.927063229853763e-05,
"loss": 0.4535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4484739303588867,
"step": 780,
"valid_targets_mean": 3771.4,
"valid_targets_min": 1028
},
{
"epoch": 1.2539936102236422,
"grad_norm": 0.7829452545267517,
"learning_rate": 3.9249158795790316e-05,
"loss": 0.4315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4051206707954407,
"step": 785,
"valid_targets_mean": 2456.8,
"valid_targets_min": 764
},
{
"epoch": 1.2619808306709266,
"grad_norm": 0.8420722089855658,
"learning_rate": 3.9227379802774106e-05,
"loss": 0.4634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4935472011566162,
"step": 790,
"valid_targets_mean": 2295.8,
"valid_targets_min": 816
},
{
"epoch": 1.269968051118211,
"grad_norm": 0.7215521455732657,
"learning_rate": 3.920529566512852e-05,
"loss": 0.4358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4593965709209442,
"step": 795,
"valid_targets_mean": 3036.1,
"valid_targets_min": 1362
},
{
"epoch": 1.2779552715654952,
"grad_norm": 0.6783023396300084,
"learning_rate": 3.918290673333585e-05,
"loss": 0.437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4560937285423279,
"step": 800,
"valid_targets_mean": 3412.9,
"valid_targets_min": 893
},
{
"epoch": 1.2859424920127795,
"grad_norm": 0.8802145850392343,
"learning_rate": 3.916021336271556e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42020413279533386,
"step": 805,
"valid_targets_mean": 2170.1,
"valid_targets_min": 722
},
{
"epoch": 1.293929712460064,
"grad_norm": 0.8120285437652148,
"learning_rate": 3.913721591341867e-05,
"loss": 0.4176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41880103945732117,
"step": 810,
"valid_targets_mean": 2954.5,
"valid_targets_min": 1212
},
{
"epoch": 1.3019169329073481,
"grad_norm": 0.8288104538653214,
"learning_rate": 3.9113914750421985e-05,
"loss": 0.4255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41077354550361633,
"step": 815,
"valid_targets_mean": 2509.9,
"valid_targets_min": 1417
},
{
"epoch": 1.3099041533546325,
"grad_norm": 0.8618512146438632,
"learning_rate": 3.9090310243522394e-05,
"loss": 0.4259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44943004846572876,
"step": 820,
"valid_targets_mean": 2502.8,
"valid_targets_min": 1461
},
{
"epoch": 1.317891373801917,
"grad_norm": 0.7760318158209316,
"learning_rate": 3.90664027673309e-05,
"loss": 0.4501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4216914772987366,
"step": 825,
"valid_targets_mean": 2769.1,
"valid_targets_min": 1289
},
{
"epoch": 1.3258785942492013,
"grad_norm": 0.6906923363443747,
"learning_rate": 3.904219270126677e-05,
"loss": 0.4191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.415194571018219,
"step": 830,
"valid_targets_mean": 3361.9,
"valid_targets_min": 1049
},
{
"epoch": 1.3338658146964857,
"grad_norm": 0.8174353322181585,
"learning_rate": 3.901768042955144e-05,
"loss": 0.4324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45407986640930176,
"step": 835,
"valid_targets_mean": 2556.1,
"valid_targets_min": 1003
},
{
"epoch": 1.34185303514377,
"grad_norm": 0.7692657856870714,
"learning_rate": 3.8992866341202446e-05,
"loss": 0.4124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.393581748008728,
"step": 840,
"valid_targets_mean": 2292.6,
"valid_targets_min": 981
},
{
"epoch": 1.3498402555910542,
"grad_norm": 0.7721910677108021,
"learning_rate": 3.8967750830027277e-05,
"loss": 0.4225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43121227622032166,
"step": 845,
"valid_targets_mean": 2591.4,
"valid_targets_min": 1106
},
{
"epoch": 1.3578274760383386,
"grad_norm": 0.7607761762713008,
"learning_rate": 3.894233429461706e-05,
"loss": 0.4357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45984774827957153,
"step": 850,
"valid_targets_mean": 2971.3,
"valid_targets_min": 1249
},
{
"epoch": 1.365814696485623,
"grad_norm": 0.7549358056556162,
"learning_rate": 3.89166171383403e-05,
"loss": 0.4134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4264622926712036,
"step": 855,
"valid_targets_mean": 2585.4,
"valid_targets_min": 1483
},
{
"epoch": 1.3738019169329074,
"grad_norm": 0.721426310472384,
"learning_rate": 3.889059976933644e-05,
"loss": 0.4258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4268583059310913,
"step": 860,
"valid_targets_mean": 2885.3,
"valid_targets_min": 1173
},
{
"epoch": 1.3817891373801916,
"grad_norm": 0.7720799009636946,
"learning_rate": 3.88642826005094e-05,
"loss": 0.4505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42852962017059326,
"step": 865,
"valid_targets_mean": 2731.6,
"valid_targets_min": 871
},
{
"epoch": 1.389776357827476,
"grad_norm": 0.8470631851658071,
"learning_rate": 3.883766604952102e-05,
"loss": 0.4547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49135443568229675,
"step": 870,
"valid_targets_mean": 2234.6,
"valid_targets_min": 999
},
{
"epoch": 1.3977635782747604,
"grad_norm": 0.7411779868421573,
"learning_rate": 3.8810750538784404e-05,
"loss": 0.4435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4041995406150818,
"step": 875,
"valid_targets_mean": 2670.5,
"valid_targets_min": 1122
},
{
"epoch": 1.4057507987220448,
"grad_norm": 0.7140299672524761,
"learning_rate": 3.878353649545728e-05,
"loss": 0.4402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.435030996799469,
"step": 880,
"valid_targets_mean": 3004.1,
"valid_targets_min": 1197
},
{
"epoch": 1.4137380191693292,
"grad_norm": 0.7923681119897052,
"learning_rate": 3.875602435143517e-05,
"loss": 0.4411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3961261510848999,
"step": 885,
"valid_targets_mean": 2766.9,
"valid_targets_min": 862
},
{
"epoch": 1.4217252396166133,
"grad_norm": 0.7705589230089058,
"learning_rate": 3.872821454334453e-05,
"loss": 0.4351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4006156921386719,
"step": 890,
"valid_targets_mean": 2416.2,
"valid_targets_min": 1003
},
{
"epoch": 1.4297124600638977,
"grad_norm": 0.6925517039660947,
"learning_rate": 3.870010751253587e-05,
"loss": 0.4377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4088160991668701,
"step": 895,
"valid_targets_mean": 3179.1,
"valid_targets_min": 763
},
{
"epoch": 1.4376996805111821,
"grad_norm": 0.8307106887932786,
"learning_rate": 3.867170370507668e-05,
"loss": 0.4581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4864905774593353,
"step": 900,
"valid_targets_mean": 2541.1,
"valid_targets_min": 778
},
{
"epoch": 1.4456869009584665,
"grad_norm": 0.9623816866236481,
"learning_rate": 3.8643003571744445e-05,
"loss": 0.4486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4354180693626404,
"step": 905,
"valid_targets_mean": 2225.6,
"valid_targets_min": 1063
},
{
"epoch": 1.4536741214057507,
"grad_norm": 0.7716245831699764,
"learning_rate": 3.861400756801938e-05,
"loss": 0.4606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4495222568511963,
"step": 910,
"valid_targets_mean": 3027.4,
"valid_targets_min": 919
},
{
"epoch": 1.461661341853035,
"grad_norm": 0.7484846052853862,
"learning_rate": 3.8584716154077286e-05,
"loss": 0.4305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4441258907318115,
"step": 915,
"valid_targets_mean": 3202.1,
"valid_targets_min": 1124
},
{
"epoch": 1.4696485623003195,
"grad_norm": 0.7368859538362733,
"learning_rate": 3.855512979478222e-05,
"loss": 0.4252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3749830722808838,
"step": 920,
"valid_targets_mean": 2625.4,
"valid_targets_min": 1193
},
{
"epoch": 1.4776357827476039,
"grad_norm": 0.6049367824225332,
"learning_rate": 3.852524895967911e-05,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38308608531951904,
"step": 925,
"valid_targets_mean": 4036.0,
"valid_targets_min": 1111
},
{
"epoch": 1.4856230031948883,
"grad_norm": 0.7427843372018998,
"learning_rate": 3.8495074122986296e-05,
"loss": 0.4265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4193194806575775,
"step": 930,
"valid_targets_mean": 2806.4,
"valid_targets_min": 789
},
{
"epoch": 1.4936102236421724,
"grad_norm": 0.679197562951001,
"learning_rate": 3.846460576358804e-05,
"loss": 0.4365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44789695739746094,
"step": 935,
"valid_targets_mean": 3683.1,
"valid_targets_min": 1532
},
{
"epoch": 1.5015974440894568,
"grad_norm": 0.6722746741760623,
"learning_rate": 3.843384436502688e-05,
"loss": 0.4293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4009643793106079,
"step": 940,
"valid_targets_mean": 3287.3,
"valid_targets_min": 1028
},
{
"epoch": 1.5095846645367412,
"grad_norm": 0.7368258927731269,
"learning_rate": 3.8402790415496e-05,
"loss": 0.4549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43784040212631226,
"step": 945,
"valid_targets_mean": 2733.6,
"valid_targets_min": 1148
},
{
"epoch": 1.5175718849840254,
"grad_norm": 0.7152894771456657,
"learning_rate": 3.837144440783144e-05,
"loss": 0.4161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44536614418029785,
"step": 950,
"valid_targets_mean": 3164.2,
"valid_targets_min": 1067
},
{
"epoch": 1.5255591054313098,
"grad_norm": 0.7947534576481916,
"learning_rate": 3.833980683950431e-05,
"loss": 0.4814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4934665858745575,
"step": 955,
"valid_targets_mean": 2351.3,
"valid_targets_min": 651
},
{
"epoch": 1.5335463258785942,
"grad_norm": 0.7875282517828147,
"learning_rate": 3.8307878212612886e-05,
"loss": 0.4418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43938589096069336,
"step": 960,
"valid_targets_mean": 2303.6,
"valid_targets_min": 1131
},
{
"epoch": 1.5415335463258786,
"grad_norm": 0.5923903169412785,
"learning_rate": 3.827565903387461e-05,
"loss": 0.4374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41518276929855347,
"step": 965,
"valid_targets_mean": 4034.9,
"valid_targets_min": 1231
},
{
"epoch": 1.549520766773163,
"grad_norm": 0.8910911155444613,
"learning_rate": 3.82431498146181e-05,
"loss": 0.4357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4936522841453552,
"step": 970,
"valid_targets_mean": 2327.3,
"valid_targets_min": 834
},
{
"epoch": 1.5575079872204474,
"grad_norm": 0.6459335309997667,
"learning_rate": 3.821035107077499e-05,
"loss": 0.4358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41498053073883057,
"step": 975,
"valid_targets_mean": 3341.9,
"valid_targets_min": 1006
},
{
"epoch": 1.5654952076677318,
"grad_norm": 0.6926152294260767,
"learning_rate": 3.817726332287179e-05,
"loss": 0.4259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4034827947616577,
"step": 980,
"valid_targets_mean": 3087.4,
"valid_targets_min": 1153
},
{
"epoch": 1.573482428115016,
"grad_norm": 0.8034994479627938,
"learning_rate": 3.814388709602155e-05,
"loss": 0.4412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43312889337539673,
"step": 985,
"valid_targets_mean": 2240.4,
"valid_targets_min": 1043
},
{
"epoch": 1.5814696485623003,
"grad_norm": 0.7989642353413773,
"learning_rate": 3.8110222919915626e-05,
"loss": 0.4381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4340096414089203,
"step": 990,
"valid_targets_mean": 2381.8,
"valid_targets_min": 791
},
{
"epoch": 1.5894568690095847,
"grad_norm": 0.6447498747286449,
"learning_rate": 3.8076271328815175e-05,
"loss": 0.4441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42020028829574585,
"step": 995,
"valid_targets_mean": 3908.2,
"valid_targets_min": 1254
},
{
"epoch": 1.5974440894568689,
"grad_norm": 0.6380365159848356,
"learning_rate": 3.804203286154275e-05,
"loss": 0.4065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4114200472831726,
"step": 1000,
"valid_targets_mean": 3355.1,
"valid_targets_min": 1473
},
{
"epoch": 1.6054313099041533,
"grad_norm": 0.636811929140562,
"learning_rate": 3.800750806147371e-05,
"loss": 0.4364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4242017865180969,
"step": 1005,
"valid_targets_mean": 3736.1,
"valid_targets_min": 1562
},
{
"epoch": 1.6134185303514377,
"grad_norm": 0.7542875453304175,
"learning_rate": 3.79726974765276e-05,
"loss": 0.4566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4269424080848694,
"step": 1010,
"valid_targets_mean": 3016.4,
"valid_targets_min": 848
},
{
"epoch": 1.621405750798722,
"grad_norm": 0.6894222849805512,
"learning_rate": 3.793760165915947e-05,
"loss": 0.4412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4064532518386841,
"step": 1015,
"valid_targets_mean": 3785.7,
"valid_targets_min": 737
},
{
"epoch": 1.6293929712460065,
"grad_norm": 0.7778570976152539,
"learning_rate": 3.7902221166351106e-05,
"loss": 0.4165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4298957586288452,
"step": 1020,
"valid_targets_mean": 2434.3,
"valid_targets_min": 864
},
{
"epoch": 1.6373801916932909,
"grad_norm": 0.6857539738494024,
"learning_rate": 3.786655655960216e-05,
"loss": 0.4267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4040903151035309,
"step": 1025,
"valid_targets_mean": 2788.6,
"valid_targets_min": 1324
},
{
"epoch": 1.645367412140575,
"grad_norm": 0.7706739406760523,
"learning_rate": 3.7830608404921294e-05,
"loss": 0.4269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.457536906003952,
"step": 1030,
"valid_targets_mean": 2625.8,
"valid_targets_min": 1098
},
{
"epoch": 1.6533546325878594,
"grad_norm": 0.7189631307182224,
"learning_rate": 3.7794377272817144e-05,
"loss": 0.4513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4552885591983795,
"step": 1035,
"valid_targets_mean": 3002.1,
"valid_targets_min": 1346
},
{
"epoch": 1.6613418530351438,
"grad_norm": 0.6939968937775858,
"learning_rate": 3.775786373828929e-05,
"loss": 0.4401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42244094610214233,
"step": 1040,
"valid_targets_mean": 3193.0,
"valid_targets_min": 1181
},
{
"epoch": 1.669329073482428,
"grad_norm": 0.8310645339562641,
"learning_rate": 3.7721068380819135e-05,
"loss": 0.449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4165183901786804,
"step": 1045,
"valid_targets_mean": 2545.9,
"valid_targets_min": 1071
},
{
"epoch": 1.6773162939297124,
"grad_norm": 0.6767363971798981,
"learning_rate": 3.768399178436069e-05,
"loss": 0.439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44542649388313293,
"step": 1050,
"valid_targets_mean": 3308.1,
"valid_targets_min": 995
},
{
"epoch": 1.6853035143769968,
"grad_norm": 0.6972061039612378,
"learning_rate": 3.764663453733135e-05,
"loss": 0.4617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48311084508895874,
"step": 1055,
"valid_targets_mean": 3087.3,
"valid_targets_min": 1261
},
{
"epoch": 1.6932907348242812,
"grad_norm": 0.7005302044576569,
"learning_rate": 3.7608997232602475e-05,
"loss": 0.421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38864031434059143,
"step": 1060,
"valid_targets_mean": 2687.6,
"valid_targets_min": 923
},
{
"epoch": 1.7012779552715656,
"grad_norm": 0.6895071074838427,
"learning_rate": 3.757108046749006e-05,
"loss": 0.449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41667845845222473,
"step": 1065,
"valid_targets_mean": 2960.2,
"valid_targets_min": 1043
},
{
"epoch": 1.70926517571885,
"grad_norm": 0.7256933741627416,
"learning_rate": 3.753288484374524e-05,
"loss": 0.439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4952039420604706,
"step": 1070,
"valid_targets_mean": 2882.8,
"valid_targets_min": 1440
},
{
"epoch": 1.7172523961661343,
"grad_norm": 0.7266869951359273,
"learning_rate": 3.7494410967544674e-05,
"loss": 0.4438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4499083161354065,
"step": 1075,
"valid_targets_mean": 2684.9,
"valid_targets_min": 891
},
{
"epoch": 1.7252396166134185,
"grad_norm": 0.7287210054336749,
"learning_rate": 3.745565944948103e-05,
"loss": 0.4326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4443957507610321,
"step": 1080,
"valid_targets_mean": 3179.3,
"valid_targets_min": 1110
},
{
"epoch": 1.733226837060703,
"grad_norm": 0.7302401962493207,
"learning_rate": 3.7416630904553205e-05,
"loss": 0.42,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3901965618133545,
"step": 1085,
"valid_targets_mean": 2506.9,
"valid_targets_min": 1108
},
{
"epoch": 1.741214057507987,
"grad_norm": 0.7621719007011174,
"learning_rate": 3.737732595215663e-05,
"loss": 0.4318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49417999386787415,
"step": 1090,
"valid_targets_mean": 2648.5,
"valid_targets_min": 966
},
{
"epoch": 1.7492012779552715,
"grad_norm": 0.7488069211998931,
"learning_rate": 3.733774521607338e-05,
"loss": 0.4237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45603471994400024,
"step": 1095,
"valid_targets_mean": 2818.9,
"valid_targets_min": 1088
},
{
"epoch": 1.7571884984025559,
"grad_norm": 0.8084202592590568,
"learning_rate": 3.729788932446231e-05,
"loss": 0.4242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45258504152297974,
"step": 1100,
"valid_targets_mean": 2080.5,
"valid_targets_min": 1112
},
{
"epoch": 1.7651757188498403,
"grad_norm": 0.6611827236924629,
"learning_rate": 3.7257758909849107e-05,
"loss": 0.4394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44405344128608704,
"step": 1105,
"valid_targets_mean": 3858.6,
"valid_targets_min": 808
},
{
"epoch": 1.7731629392971247,
"grad_norm": 0.6162135150058156,
"learning_rate": 3.72173546091162e-05,
"loss": 0.4372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42961829900741577,
"step": 1110,
"valid_targets_mean": 3943.2,
"valid_targets_min": 1108
},
{
"epoch": 1.781150159744409,
"grad_norm": 0.7394032295272298,
"learning_rate": 3.7176677063492685e-05,
"loss": 0.4463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45540672540664673,
"step": 1115,
"valid_targets_mean": 2557.6,
"valid_targets_min": 970
},
{
"epoch": 1.7891373801916934,
"grad_norm": 0.7739659694704212,
"learning_rate": 3.713572691854414e-05,
"loss": 0.4132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4244069457054138,
"step": 1120,
"valid_targets_mean": 2507.1,
"valid_targets_min": 912
},
{
"epoch": 1.7971246006389776,
"grad_norm": 0.7905713199175826,
"learning_rate": 3.709450482416239e-05,
"loss": 0.4084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4046608805656433,
"step": 1125,
"valid_targets_mean": 2224.6,
"valid_targets_min": 1342
},
{
"epoch": 1.805111821086262,
"grad_norm": 0.7853975413698725,
"learning_rate": 3.7053011434555165e-05,
"loss": 0.4181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4040316343307495,
"step": 1130,
"valid_targets_mean": 2187.2,
"valid_targets_min": 949
},
{
"epoch": 1.8130990415335462,
"grad_norm": 1.5880148849392963,
"learning_rate": 3.701124740823575e-05,
"loss": 0.4296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4547976553440094,
"step": 1135,
"valid_targets_mean": 1833.9,
"valid_targets_min": 430
},
{
"epoch": 1.8210862619808306,
"grad_norm": 0.7259644824294608,
"learning_rate": 3.696921340801253e-05,
"loss": 0.4415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4141627550125122,
"step": 1140,
"valid_targets_mean": 3010.8,
"valid_targets_min": 1068
},
{
"epoch": 1.829073482428115,
"grad_norm": 0.6763295168488686,
"learning_rate": 3.6926910100978444e-05,
"loss": 0.4196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4594937860965729,
"step": 1145,
"valid_targets_mean": 3553.1,
"valid_targets_min": 923
},
{
"epoch": 1.8370607028753994,
"grad_norm": 0.7698782558795708,
"learning_rate": 3.688433815850041e-05,
"loss": 0.4235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4128667712211609,
"step": 1150,
"valid_targets_mean": 2459.1,
"valid_targets_min": 923
},
{
"epoch": 1.8450479233226837,
"grad_norm": 0.958655027556145,
"learning_rate": 3.68414982562087e-05,
"loss": 0.42,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4355429410934448,
"step": 1155,
"valid_targets_mean": 1698.6,
"valid_targets_min": 934
},
{
"epoch": 1.8530351437699681,
"grad_norm": 0.7513635672673216,
"learning_rate": 3.679839107398618e-05,
"loss": 0.4176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45161160826683044,
"step": 1160,
"valid_targets_mean": 3201.0,
"valid_targets_min": 1142
},
{
"epoch": 1.8610223642172525,
"grad_norm": 0.7754798547552919,
"learning_rate": 3.6755017295957536e-05,
"loss": 0.4402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47688138484954834,
"step": 1165,
"valid_targets_mean": 2819.0,
"valid_targets_min": 1346
},
{
"epoch": 1.8690095846645367,
"grad_norm": 0.7883052596756699,
"learning_rate": 3.67113776104784e-05,
"loss": 0.424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4371069669723511,
"step": 1170,
"valid_targets_mean": 2428.7,
"valid_targets_min": 1220
},
{
"epoch": 1.876996805111821,
"grad_norm": 0.6696947561840654,
"learning_rate": 3.6667472710124475e-05,
"loss": 0.4416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4349396228790283,
"step": 1175,
"valid_targets_mean": 3369.9,
"valid_targets_min": 1130
},
{
"epoch": 1.8849840255591053,
"grad_norm": 0.8979562437261165,
"learning_rate": 3.6623303291680465e-05,
"loss": 0.4152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4136584997177124,
"step": 1180,
"valid_targets_mean": 2837.1,
"valid_targets_min": 747
},
{
"epoch": 1.8929712460063897,
"grad_norm": 0.6747106007234754,
"learning_rate": 3.6578870056129086e-05,
"loss": 0.4259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39019960165023804,
"step": 1185,
"valid_targets_mean": 3195.2,
"valid_targets_min": 1219
},
{
"epoch": 1.900958466453674,
"grad_norm": 0.6216752591895326,
"learning_rate": 3.653417370863992e-05,
"loss": 0.423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41113990545272827,
"step": 1190,
"valid_targets_mean": 3552.1,
"valid_targets_min": 1157
},
{
"epoch": 1.9089456869009584,
"grad_norm": 0.6107745396982358,
"learning_rate": 3.6489214958558206e-05,
"loss": 0.4376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4672267436981201,
"step": 1195,
"valid_targets_mean": 4152.6,
"valid_targets_min": 1233
},
{
"epoch": 1.9169329073482428,
"grad_norm": 0.6564451674349974,
"learning_rate": 3.644399451939358e-05,
"loss": 0.4168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39774927496910095,
"step": 1200,
"valid_targets_mean": 2968.9,
"valid_targets_min": 1242
},
{
"epoch": 1.9249201277955272,
"grad_norm": 0.7771431898711396,
"learning_rate": 3.639851310880881e-05,
"loss": 0.4622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5002536773681641,
"step": 1205,
"valid_targets_mean": 2619.9,
"valid_targets_min": 1063
},
{
"epoch": 1.9329073482428116,
"grad_norm": 0.7533507907086239,
"learning_rate": 3.635277144860834e-05,
"loss": 0.4209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4327402710914612,
"step": 1210,
"valid_targets_mean": 2435.6,
"valid_targets_min": 657
},
{
"epoch": 1.9408945686900958,
"grad_norm": 0.6838599740152425,
"learning_rate": 3.630677026472684e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42494964599609375,
"step": 1215,
"valid_targets_mean": 2926.8,
"valid_targets_min": 860
},
{
"epoch": 1.9488817891373802,
"grad_norm": 0.7046006759588175,
"learning_rate": 3.626051028721773e-05,
"loss": 0.4446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4118865132331848,
"step": 1220,
"valid_targets_mean": 2795.1,
"valid_targets_min": 740
},
{
"epoch": 1.9568690095846646,
"grad_norm": 0.7846235878176491,
"learning_rate": 3.621399225024156e-05,
"loss": 0.4277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4167096018791199,
"step": 1225,
"valid_targets_mean": 2380.5,
"valid_targets_min": 869
},
{
"epoch": 1.9648562300319488,
"grad_norm": 0.6729799838262991,
"learning_rate": 3.616721689205436e-05,
"loss": 0.4147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3980925381183624,
"step": 1230,
"valid_targets_mean": 2988.2,
"valid_targets_min": 1022
},
{
"epoch": 1.9728434504792332,
"grad_norm": 0.7826130416711469,
"learning_rate": 3.612018495499594e-05,
"loss": 0.4399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42765045166015625,
"step": 1235,
"valid_targets_mean": 2436.8,
"valid_targets_min": 1103
},
{
"epoch": 1.9808306709265175,
"grad_norm": 0.662773336531969,
"learning_rate": 3.6072897185478074e-05,
"loss": 0.4131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43413665890693665,
"step": 1240,
"valid_targets_mean": 3430.6,
"valid_targets_min": 1036
},
{
"epoch": 1.988817891373802,
"grad_norm": 0.6600752452234055,
"learning_rate": 3.6025354333972714e-05,
"loss": 0.4079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41904622316360474,
"step": 1245,
"valid_targets_mean": 3193.2,
"valid_targets_min": 1213
},
{
"epoch": 1.9968051118210863,
"grad_norm": 0.7364834761692404,
"learning_rate": 3.597755715500002e-05,
"loss": 0.4179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4459013342857361,
"step": 1250,
"valid_targets_mean": 2883.5,
"valid_targets_min": 1221
},
{
"epoch": 2.0047923322683707,
"grad_norm": 0.6757605852428736,
"learning_rate": 3.592950640711642e-05,
"loss": 0.3716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3445654511451721,
"step": 1255,
"valid_targets_mean": 2511.2,
"valid_targets_min": 1113
},
{
"epoch": 2.012779552715655,
"grad_norm": 0.7920973856730682,
"learning_rate": 3.5881202852902543e-05,
"loss": 0.3774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37682023644447327,
"step": 1260,
"valid_targets_mean": 2531.8,
"valid_targets_min": 803
},
{
"epoch": 2.0207667731629395,
"grad_norm": 0.7084485618774308,
"learning_rate": 3.583264725895117e-05,
"loss": 0.4095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40177470445632935,
"step": 1265,
"valid_targets_mean": 3139.1,
"valid_targets_min": 722
},
{
"epoch": 2.0287539936102235,
"grad_norm": 0.8654181955391402,
"learning_rate": 3.5783840395854984e-05,
"loss": 0.3706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34793633222579956,
"step": 1270,
"valid_targets_mean": 2136.0,
"valid_targets_min": 784
},
{
"epoch": 2.036741214057508,
"grad_norm": 0.8291615059541649,
"learning_rate": 3.5734783038194446e-05,
"loss": 0.4007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46559375524520874,
"step": 1275,
"valid_targets_mean": 2901.5,
"valid_targets_min": 1184
},
{
"epoch": 2.0447284345047922,
"grad_norm": 0.7323741707579677,
"learning_rate": 3.5685475964525396e-05,
"loss": 0.3937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37584206461906433,
"step": 1280,
"valid_targets_mean": 3211.1,
"valid_targets_min": 957
},
{
"epoch": 2.0527156549520766,
"grad_norm": 0.7363883381038177,
"learning_rate": 3.5635919957366775e-05,
"loss": 0.398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41028380393981934,
"step": 1285,
"valid_targets_mean": 2933.5,
"valid_targets_min": 1190
},
{
"epoch": 2.060702875399361,
"grad_norm": 0.7315517816142877,
"learning_rate": 3.558611580318817e-05,
"loss": 0.3996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4214468002319336,
"step": 1290,
"valid_targets_mean": 3097.8,
"valid_targets_min": 1193
},
{
"epoch": 2.0686900958466454,
"grad_norm": 0.7175863284248388,
"learning_rate": 3.5536064292397334e-05,
"loss": 0.4115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38822758197784424,
"step": 1295,
"valid_targets_mean": 3118.4,
"valid_targets_min": 1089
},
{
"epoch": 2.07667731629393,
"grad_norm": 0.6909079310550906,
"learning_rate": 3.548576621932766e-05,
"loss": 0.4088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37539142370224,
"step": 1300,
"valid_targets_mean": 3059.8,
"valid_targets_min": 1378
},
{
"epoch": 2.084664536741214,
"grad_norm": 0.8341553393326651,
"learning_rate": 3.543522238222555e-05,
"loss": 0.3994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39283639192581177,
"step": 1305,
"valid_targets_mean": 2444.9,
"valid_targets_min": 733
},
{
"epoch": 2.0926517571884986,
"grad_norm": 0.7467643791808043,
"learning_rate": 3.538443358323777e-05,
"loss": 0.3992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4031786322593689,
"step": 1310,
"valid_targets_mean": 3537.6,
"valid_targets_min": 671
},
{
"epoch": 2.1006389776357826,
"grad_norm": 0.7427721777091812,
"learning_rate": 3.5333400628398696e-05,
"loss": 0.3946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35075265169143677,
"step": 1315,
"valid_targets_mean": 3124.6,
"valid_targets_min": 1320
},
{
"epoch": 2.108626198083067,
"grad_norm": 0.723617897881399,
"learning_rate": 3.5282124327617556e-05,
"loss": 0.3989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4392593502998352,
"step": 1320,
"valid_targets_mean": 3268.4,
"valid_targets_min": 614
},
{
"epoch": 2.1166134185303513,
"grad_norm": 0.788438144653811,
"learning_rate": 3.5230605494665535e-05,
"loss": 0.3774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3712785840034485,
"step": 1325,
"valid_targets_mean": 2644.2,
"valid_targets_min": 463
},
{
"epoch": 2.1246006389776357,
"grad_norm": 0.8022216072730797,
"learning_rate": 3.517884494716289e-05,
"loss": 0.4069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4960511028766632,
"step": 1330,
"valid_targets_mean": 3651.8,
"valid_targets_min": 836
},
{
"epoch": 2.13258785942492,
"grad_norm": 0.6925487153270358,
"learning_rate": 3.512684350656596e-05,
"loss": 0.375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37404677271842957,
"step": 1335,
"valid_targets_mean": 3246.2,
"valid_targets_min": 1109
},
{
"epoch": 2.1405750798722045,
"grad_norm": 0.8170016680451098,
"learning_rate": 3.507460199815414e-05,
"loss": 0.407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3906192183494568,
"step": 1340,
"valid_targets_mean": 2524.4,
"valid_targets_min": 1046
},
{
"epoch": 2.148562300319489,
"grad_norm": 0.8211212957436506,
"learning_rate": 3.5022121251016786e-05,
"loss": 0.3728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36858224868774414,
"step": 1345,
"valid_targets_mean": 2289.2,
"valid_targets_min": 1063
},
{
"epoch": 2.1565495207667733,
"grad_norm": 0.7865399000617666,
"learning_rate": 3.4969402098040015e-05,
"loss": 0.3767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38670629262924194,
"step": 1350,
"valid_targets_mean": 2472.7,
"valid_targets_min": 723
},
{
"epoch": 2.1645367412140577,
"grad_norm": 0.6781855298456426,
"learning_rate": 3.491644537589356e-05,
"loss": 0.393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42566969990730286,
"step": 1355,
"valid_targets_mean": 3834.5,
"valid_targets_min": 1217
},
{
"epoch": 2.1725239616613417,
"grad_norm": 0.7316618715739758,
"learning_rate": 3.486325192501743e-05,
"loss": 0.3876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34030255675315857,
"step": 1360,
"valid_targets_mean": 2474.6,
"valid_targets_min": 851
},
{
"epoch": 2.180511182108626,
"grad_norm": 0.780177709972403,
"learning_rate": 3.480982258960859e-05,
"loss": 0.3992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4071018695831299,
"step": 1365,
"valid_targets_mean": 2566.9,
"valid_targets_min": 1108
},
{
"epoch": 2.1884984025559104,
"grad_norm": 0.7401670928315446,
"learning_rate": 3.47561582176076e-05,
"loss": 0.3765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34878408908843994,
"step": 1370,
"valid_targets_mean": 2431.8,
"valid_targets_min": 732
},
{
"epoch": 2.196485623003195,
"grad_norm": 0.8285074677263214,
"learning_rate": 3.470225966068507e-05,
"loss": 0.3942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38772809505462646,
"step": 1375,
"valid_targets_mean": 2775.9,
"valid_targets_min": 1309
},
{
"epoch": 2.2044728434504792,
"grad_norm": 0.6951035757973937,
"learning_rate": 3.464812777422826e-05,
"loss": 0.3741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33720552921295166,
"step": 1380,
"valid_targets_mean": 2747.8,
"valid_targets_min": 1107
},
{
"epoch": 2.2124600638977636,
"grad_norm": 0.6933666013886233,
"learning_rate": 3.459376341732741e-05,
"loss": 0.3755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3822613060474396,
"step": 1385,
"valid_targets_mean": 3665.7,
"valid_targets_min": 1010
},
{
"epoch": 2.220447284345048,
"grad_norm": 0.844133409567668,
"learning_rate": 3.453916745276213e-05,
"loss": 0.3849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40487003326416016,
"step": 1390,
"valid_targets_mean": 2339.1,
"valid_targets_min": 1010
},
{
"epoch": 2.2284345047923324,
"grad_norm": 0.7635668779470315,
"learning_rate": 3.4484340746987745e-05,
"loss": 0.3745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40360257029533386,
"step": 1395,
"valid_targets_mean": 3000.1,
"valid_targets_min": 617
},
{
"epoch": 2.236421725239617,
"grad_norm": 0.8939714206815781,
"learning_rate": 3.4429284170121494e-05,
"loss": 0.3828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39973244071006775,
"step": 1400,
"valid_targets_mean": 2310.8,
"valid_targets_min": 1108
},
{
"epoch": 2.244408945686901,
"grad_norm": 0.7965029242154419,
"learning_rate": 3.4373998595928764e-05,
"loss": 0.3769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35486793518066406,
"step": 1405,
"valid_targets_mean": 2493.4,
"valid_targets_min": 1100
},
{
"epoch": 2.252396166134185,
"grad_norm": 0.8968879107376081,
"learning_rate": 3.431848490180919e-05,
"loss": 0.385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3879396319389343,
"step": 1410,
"valid_targets_mean": 1842.8,
"valid_targets_min": 641
},
{
"epoch": 2.2603833865814695,
"grad_norm": 0.6571979135953678,
"learning_rate": 3.4262743968782736e-05,
"loss": 0.3985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3954229950904846,
"step": 1415,
"valid_targets_mean": 3515.6,
"valid_targets_min": 1404
},
{
"epoch": 2.268370607028754,
"grad_norm": 0.7277635785906069,
"learning_rate": 3.4206776681475737e-05,
"loss": 0.366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36266952753067017,
"step": 1420,
"valid_targets_mean": 2741.3,
"valid_targets_min": 1230
},
{
"epoch": 2.2763578274760383,
"grad_norm": 0.7907521602479675,
"learning_rate": 3.415058392810682e-05,
"loss": 0.4066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4322172999382019,
"step": 1425,
"valid_targets_mean": 2997.9,
"valid_targets_min": 1321
},
{
"epoch": 2.2843450479233227,
"grad_norm": 0.8176547611925157,
"learning_rate": 3.409416660047286e-05,
"loss": 0.3977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3814924955368042,
"step": 1430,
"valid_targets_mean": 2555.4,
"valid_targets_min": 1205
},
{
"epoch": 2.292332268370607,
"grad_norm": 0.822452014818755,
"learning_rate": 3.403752559393477e-05,
"loss": 0.3974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4026378393173218,
"step": 1435,
"valid_targets_mean": 2191.9,
"valid_targets_min": 958
},
{
"epoch": 2.3003194888178915,
"grad_norm": 0.8046031130809067,
"learning_rate": 3.398066180740332e-05,
"loss": 0.3808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3843550384044647,
"step": 1440,
"valid_targets_mean": 2522.8,
"valid_targets_min": 1101
},
{
"epoch": 2.308306709265176,
"grad_norm": 0.7274042476803793,
"learning_rate": 3.39235761433249e-05,
"loss": 0.3742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3560572564601898,
"step": 1445,
"valid_targets_mean": 2997.4,
"valid_targets_min": 970
},
{
"epoch": 2.31629392971246,
"grad_norm": 0.7942573376789508,
"learning_rate": 3.386626950766713e-05,
"loss": 0.408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4524349570274353,
"step": 1450,
"valid_targets_mean": 2827.2,
"valid_targets_min": 847
},
{
"epoch": 2.3242811501597442,
"grad_norm": 0.7144054959460292,
"learning_rate": 3.380874280990454e-05,
"loss": 0.3819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43069761991500854,
"step": 1455,
"valid_targets_mean": 2820.1,
"valid_targets_min": 815
},
{
"epoch": 2.3322683706070286,
"grad_norm": 0.7615884351566543,
"learning_rate": 3.37509969630041e-05,
"loss": 0.3902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3636676073074341,
"step": 1460,
"valid_targets_mean": 2552.9,
"valid_targets_min": 1197
},
{
"epoch": 2.340255591054313,
"grad_norm": 0.7256710670235811,
"learning_rate": 3.369303288341078e-05,
"loss": 0.3884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4177743196487427,
"step": 1465,
"valid_targets_mean": 3103.6,
"valid_targets_min": 1031
},
{
"epoch": 2.3482428115015974,
"grad_norm": 0.7877476651897006,
"learning_rate": 3.363485149103292e-05,
"loss": 0.3647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35964199900627136,
"step": 1470,
"valid_targets_mean": 2302.8,
"valid_targets_min": 1014
},
{
"epoch": 2.356230031948882,
"grad_norm": 0.7861951999481999,
"learning_rate": 3.357645370922772e-05,
"loss": 0.3741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3646368682384491,
"step": 1475,
"valid_targets_mean": 2470.4,
"valid_targets_min": 892
},
{
"epoch": 2.364217252396166,
"grad_norm": 0.8067034022369052,
"learning_rate": 3.351784046478655e-05,
"loss": 0.3799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37805867195129395,
"step": 1480,
"valid_targets_mean": 2684.4,
"valid_targets_min": 903
},
{
"epoch": 2.3722044728434506,
"grad_norm": 0.6891254864220063,
"learning_rate": 3.345901268792022e-05,
"loss": 0.3801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34303462505340576,
"step": 1485,
"valid_targets_mean": 2823.6,
"valid_targets_min": 1036
},
{
"epoch": 2.380191693290735,
"grad_norm": 0.6714839482371276,
"learning_rate": 3.3399971312244255e-05,
"loss": 0.3887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3872262239456177,
"step": 1490,
"valid_targets_mean": 3700.4,
"valid_targets_min": 1165
},
{
"epoch": 2.3881789137380194,
"grad_norm": 0.7565316440719079,
"learning_rate": 3.334071727476406e-05,
"loss": 0.4195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4261237680912018,
"step": 1495,
"valid_targets_mean": 2838.0,
"valid_targets_min": 1114
},
{
"epoch": 2.3961661341853033,
"grad_norm": 0.8114152537250999,
"learning_rate": 3.3281251515860035e-05,
"loss": 0.395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45717281103134155,
"step": 1500,
"valid_targets_mean": 2492.4,
"valid_targets_min": 951
},
{
"epoch": 2.4041533546325877,
"grad_norm": 0.6856900658234324,
"learning_rate": 3.3221574979272676e-05,
"loss": 0.3724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39079922437667847,
"step": 1505,
"valid_targets_mean": 3183.8,
"valid_targets_min": 1362
},
{
"epoch": 2.412140575079872,
"grad_norm": 0.7703186250399462,
"learning_rate": 3.316168861208759e-05,
"loss": 0.3763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39759039878845215,
"step": 1510,
"valid_targets_mean": 2748.0,
"valid_targets_min": 1040
},
{
"epoch": 2.4201277955271565,
"grad_norm": 0.8048967002212241,
"learning_rate": 3.310159336472047e-05,
"loss": 0.3875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41734617948532104,
"step": 1515,
"valid_targets_mean": 2613.1,
"valid_targets_min": 1191
},
{
"epoch": 2.428115015974441,
"grad_norm": 0.8314543068705672,
"learning_rate": 3.304129019090198e-05,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41389578580856323,
"step": 1520,
"valid_targets_mean": 2517.2,
"valid_targets_min": 891
},
{
"epoch": 2.4361022364217253,
"grad_norm": 0.6926011452341558,
"learning_rate": 3.298078004766267e-05,
"loss": 0.3905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37540772557258606,
"step": 1525,
"valid_targets_mean": 2965.9,
"valid_targets_min": 864
},
{
"epoch": 2.4440894568690097,
"grad_norm": 0.8162573999638001,
"learning_rate": 3.292006389531774e-05,
"loss": 0.3909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4161120355129242,
"step": 1530,
"valid_targets_mean": 2317.8,
"valid_targets_min": 848
},
{
"epoch": 2.452076677316294,
"grad_norm": 0.8074891222439363,
"learning_rate": 3.2859142697451835e-05,
"loss": 0.3772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37793317437171936,
"step": 1535,
"valid_targets_mean": 2300.7,
"valid_targets_min": 944
},
{
"epoch": 2.460063897763578,
"grad_norm": 0.6859073178237398,
"learning_rate": 3.279801742090372e-05,
"loss": 0.3817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3530294895172119,
"step": 1540,
"valid_targets_mean": 2976.5,
"valid_targets_min": 1095
},
{
"epoch": 2.4680511182108624,
"grad_norm": 0.7497080904501119,
"learning_rate": 3.2736689035750975e-05,
"loss": 0.4002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38208550214767456,
"step": 1545,
"valid_targets_mean": 2632.4,
"valid_targets_min": 1187
},
{
"epoch": 2.476038338658147,
"grad_norm": 0.7658848802289646,
"learning_rate": 3.2675158515294554e-05,
"loss": 0.3628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34464403986930847,
"step": 1550,
"valid_targets_mean": 2718.4,
"valid_targets_min": 1097
},
{
"epoch": 2.484025559105431,
"grad_norm": 0.7295384665652668,
"learning_rate": 3.2613426836043386e-05,
"loss": 0.3898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40557998418807983,
"step": 1555,
"valid_targets_mean": 2924.6,
"valid_targets_min": 1126
},
{
"epoch": 2.4920127795527156,
"grad_norm": 0.7865606199528011,
"learning_rate": 3.2551494977698844e-05,
"loss": 0.3832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3619915246963501,
"step": 1560,
"valid_targets_mean": 2832.5,
"valid_targets_min": 1204
},
{
"epoch": 2.5,
"grad_norm": 0.7442594029658458,
"learning_rate": 3.248936392313921e-05,
"loss": 0.3836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3640132546424866,
"step": 1565,
"valid_targets_mean": 2665.8,
"valid_targets_min": 1110
},
{
"epoch": 2.5079872204472844,
"grad_norm": 0.7749328364765504,
"learning_rate": 3.2427034658404056e-05,
"loss": 0.374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38298264145851135,
"step": 1570,
"valid_targets_mean": 2361.2,
"valid_targets_min": 895
},
{
"epoch": 2.515974440894569,
"grad_norm": 0.70714901394141,
"learning_rate": 3.236450817267863e-05,
"loss": 0.3994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42880868911743164,
"step": 1575,
"valid_targets_mean": 3301.9,
"valid_targets_min": 1134
},
{
"epoch": 2.523961661341853,
"grad_norm": 0.711423892950476,
"learning_rate": 3.230178545827814e-05,
"loss": 0.369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3938032388687134,
"step": 1580,
"valid_targets_mean": 3337.3,
"valid_targets_min": 1438
},
{
"epoch": 2.5319488817891376,
"grad_norm": 0.8058935995764296,
"learning_rate": 3.223886751063201e-05,
"loss": 0.3766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3802354037761688,
"step": 1585,
"valid_targets_mean": 2979.3,
"valid_targets_min": 944
},
{
"epoch": 2.539936102236422,
"grad_norm": 0.7118888640775775,
"learning_rate": 3.2175755328268054e-05,
"loss": 0.374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3789049983024597,
"step": 1590,
"valid_targets_mean": 2948.6,
"valid_targets_min": 1146
},
{
"epoch": 2.547923322683706,
"grad_norm": 0.7725216659459194,
"learning_rate": 3.2112449912796675e-05,
"loss": 0.379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4516969919204712,
"step": 1595,
"valid_targets_mean": 2919.0,
"valid_targets_min": 1147
},
{
"epoch": 2.5559105431309903,
"grad_norm": 0.7527073447886554,
"learning_rate": 3.204895226889494e-05,
"loss": 0.3986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38789334893226624,
"step": 1600,
"valid_targets_mean": 2791.0,
"valid_targets_min": 1026
},
{
"epoch": 2.5638977635782747,
"grad_norm": 0.6299428402315908,
"learning_rate": 3.1985263404290634e-05,
"loss": 0.3749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.327023446559906,
"step": 1605,
"valid_targets_mean": 3438.7,
"valid_targets_min": 992
},
{
"epoch": 2.571884984025559,
"grad_norm": 0.9685044209773557,
"learning_rate": 3.19213843297463e-05,
"loss": 0.3827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4428490102291107,
"step": 1610,
"valid_targets_mean": 2068.7,
"valid_targets_min": 822
},
{
"epoch": 2.5798722044728435,
"grad_norm": 1.0295969468634165,
"learning_rate": 3.1857316059043144e-05,
"loss": 0.3998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4081227779388428,
"step": 1615,
"valid_targets_mean": 2919.2,
"valid_targets_min": 1251
},
{
"epoch": 2.587859424920128,
"grad_norm": 1.6563488775796265,
"learning_rate": 3.1793059608964986e-05,
"loss": 0.3901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4232986271381378,
"step": 1620,
"valid_targets_mean": 3450.8,
"valid_targets_min": 1362
},
{
"epoch": 2.5958466453674123,
"grad_norm": 0.9155041657894906,
"learning_rate": 3.172861599928212e-05,
"loss": 0.4202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4846240282058716,
"step": 1625,
"valid_targets_mean": 2145.2,
"valid_targets_min": 859
},
{
"epoch": 2.6038338658146962,
"grad_norm": 0.8120340384610485,
"learning_rate": 3.166398625273512e-05,
"loss": 0.3737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4154743552207947,
"step": 1630,
"valid_targets_mean": 2617.1,
"valid_targets_min": 1098
},
{
"epoch": 2.6118210862619806,
"grad_norm": 0.849225033810179,
"learning_rate": 3.15991713950186e-05,
"loss": 0.4075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4135674238204956,
"step": 1635,
"valid_targets_mean": 2334.0,
"valid_targets_min": 1142
},
{
"epoch": 2.619808306709265,
"grad_norm": 0.8157392444586056,
"learning_rate": 3.153417245476495e-05,
"loss": 0.3922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39707255363464355,
"step": 1640,
"valid_targets_mean": 2494.3,
"valid_targets_min": 870
},
{
"epoch": 2.6277955271565494,
"grad_norm": 0.6334451346931158,
"learning_rate": 3.146899046352804e-05,
"loss": 0.3636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35084402561187744,
"step": 1645,
"valid_targets_mean": 3740.7,
"valid_targets_min": 1049
},
{
"epoch": 2.635782747603834,
"grad_norm": 0.7762569328884342,
"learning_rate": 3.140362645576676e-05,
"loss": 0.3856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37259939312934875,
"step": 1650,
"valid_targets_mean": 2511.3,
"valid_targets_min": 1421
},
{
"epoch": 2.643769968051118,
"grad_norm": 0.8186237289070231,
"learning_rate": 3.133808146882871e-05,
"loss": 0.3835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4084286093711853,
"step": 1655,
"valid_targets_mean": 2329.6,
"valid_targets_min": 778
},
{
"epoch": 2.6517571884984026,
"grad_norm": 0.7125590887289628,
"learning_rate": 3.1272356542933654e-05,
"loss": 0.3972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3703764081001282,
"step": 1660,
"valid_targets_mean": 2906.2,
"valid_targets_min": 1050
},
{
"epoch": 2.659744408945687,
"grad_norm": 0.731708037956391,
"learning_rate": 3.120645272115707e-05,
"loss": 0.3943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4325590431690216,
"step": 1665,
"valid_targets_mean": 2983.2,
"valid_targets_min": 1067
},
{
"epoch": 2.6677316293929714,
"grad_norm": 0.8035997324197389,
"learning_rate": 3.114037104941355e-05,
"loss": 0.4001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38742709159851074,
"step": 1670,
"valid_targets_mean": 2473.9,
"valid_targets_min": 1059
},
{
"epoch": 2.6757188498402558,
"grad_norm": 0.6844167171779404,
"learning_rate": 3.1074112576440236e-05,
"loss": 0.4075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.368588924407959,
"step": 1675,
"valid_targets_mean": 2882.1,
"valid_targets_min": 1749
},
{
"epoch": 2.68370607028754,
"grad_norm": 0.6163401323400775,
"learning_rate": 3.1007678353780154e-05,
"loss": 0.3491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32983940839767456,
"step": 1680,
"valid_targets_mean": 3723.4,
"valid_targets_min": 878
},
{
"epoch": 2.6916932907348246,
"grad_norm": 0.6365023740994403,
"learning_rate": 3.094106943576553e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3705146908760071,
"step": 1685,
"valid_targets_mean": 3389.1,
"valid_targets_min": 948
},
{
"epoch": 2.6996805111821085,
"grad_norm": 0.7475402505642063,
"learning_rate": 3.087428687950108e-05,
"loss": 0.3958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43426042795181274,
"step": 1690,
"valid_targets_mean": 2593.7,
"valid_targets_min": 1178
},
{
"epoch": 2.707667731629393,
"grad_norm": 0.7686145007215354,
"learning_rate": 3.080733174484719e-05,
"loss": 0.3871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4154050350189209,
"step": 1695,
"valid_targets_mean": 2665.8,
"valid_targets_min": 1084
},
{
"epoch": 2.7156549520766773,
"grad_norm": 0.8563812199578894,
"learning_rate": 3.074020509440313e-05,
"loss": 0.3829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3860825300216675,
"step": 1700,
"valid_targets_mean": 2129.1,
"valid_targets_min": 879
},
{
"epoch": 2.7236421725239617,
"grad_norm": 0.75128835829166,
"learning_rate": 3.0672907993490183e-05,
"loss": 0.3772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4196065366268158,
"step": 1705,
"valid_targets_mean": 2710.2,
"valid_targets_min": 1105
},
{
"epoch": 2.731629392971246,
"grad_norm": 0.7438973966543126,
"learning_rate": 3.060544151013473e-05,
"loss": 0.383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38597315549850464,
"step": 1710,
"valid_targets_mean": 2584.2,
"valid_targets_min": 737
},
{
"epoch": 2.7396166134185305,
"grad_norm": 0.7183303748877556,
"learning_rate": 3.053780671505132e-05,
"loss": 0.3738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3752416968345642,
"step": 1715,
"valid_targets_mean": 2927.7,
"valid_targets_min": 1360
},
{
"epoch": 2.747603833865815,
"grad_norm": 0.5587721821728815,
"learning_rate": 3.047000468162563e-05,
"loss": 0.3964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36852502822875977,
"step": 1720,
"valid_targets_mean": 4415.8,
"valid_targets_min": 848
},
{
"epoch": 2.755591054313099,
"grad_norm": 0.7912750974825519,
"learning_rate": 3.0402036485897496e-05,
"loss": 0.4093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3481713533401489,
"step": 1725,
"valid_targets_mean": 2150.6,
"valid_targets_min": 573
},
{
"epoch": 2.763578274760383,
"grad_norm": 0.7655378909490561,
"learning_rate": 3.0333903206543786e-05,
"loss": 0.4075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4195517897605896,
"step": 1730,
"valid_targets_mean": 2745.0,
"valid_targets_min": 1068
},
{
"epoch": 2.7715654952076676,
"grad_norm": 0.7429503561714476,
"learning_rate": 3.02656059248613e-05,
"loss": 0.3752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38314008712768555,
"step": 1735,
"valid_targets_mean": 2676.4,
"valid_targets_min": 1083
},
{
"epoch": 2.779552715654952,
"grad_norm": 0.6847140253857491,
"learning_rate": 3.0197145724749615e-05,
"loss": 0.3835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35597318410873413,
"step": 1740,
"valid_targets_mean": 2626.1,
"valid_targets_min": 907
},
{
"epoch": 2.7875399361022364,
"grad_norm": 0.7618474409520442,
"learning_rate": 3.0128523692693865e-05,
"loss": 0.3888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.353215754032135,
"step": 1745,
"valid_targets_mean": 2811.6,
"valid_targets_min": 857
},
{
"epoch": 2.7955271565495208,
"grad_norm": 0.6759274934133018,
"learning_rate": 3.005974091774751e-05,
"loss": 0.397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39466995000839233,
"step": 1750,
"valid_targets_mean": 3399.4,
"valid_targets_min": 901
},
{
"epoch": 2.803514376996805,
"grad_norm": 0.6799590705617894,
"learning_rate": 2.999079849151505e-05,
"loss": 0.399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43251582980155945,
"step": 1755,
"valid_targets_mean": 3441.4,
"valid_targets_min": 1312
},
{
"epoch": 2.8115015974440896,
"grad_norm": 0.6610130288469123,
"learning_rate": 2.992169750813471e-05,
"loss": 0.3889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39097756147384644,
"step": 1760,
"valid_targets_mean": 3311.8,
"valid_targets_min": 1011
},
{
"epoch": 2.819488817891374,
"grad_norm": 0.7671727157019489,
"learning_rate": 2.985243906426106e-05,
"loss": 0.3821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40966904163360596,
"step": 1765,
"valid_targets_mean": 2718.1,
"valid_targets_min": 995
},
{
"epoch": 2.8274760383386583,
"grad_norm": 0.6650031120553905,
"learning_rate": 2.9783024259047617e-05,
"loss": 0.3815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.425026535987854,
"step": 1770,
"valid_targets_mean": 3584.0,
"valid_targets_min": 1194
},
{
"epoch": 2.8354632587859427,
"grad_norm": 0.8517674686517855,
"learning_rate": 2.971345419412941e-05,
"loss": 0.3923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36157435178756714,
"step": 1775,
"valid_targets_mean": 2832.7,
"valid_targets_min": 1040
},
{
"epoch": 2.8434504792332267,
"grad_norm": 0.6566982803729622,
"learning_rate": 2.964372997360548e-05,
"loss": 0.388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33444786071777344,
"step": 1780,
"valid_targets_mean": 3122.9,
"valid_targets_min": 768
},
{
"epoch": 2.851437699680511,
"grad_norm": 0.7060484582940764,
"learning_rate": 2.957385270402137e-05,
"loss": 0.3677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37771087884902954,
"step": 1785,
"valid_targets_mean": 3694.4,
"valid_targets_min": 1073
},
{
"epoch": 2.8594249201277955,
"grad_norm": 0.7198209681558054,
"learning_rate": 2.9503823494351565e-05,
"loss": 0.3719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3737558126449585,
"step": 1790,
"valid_targets_mean": 3059.6,
"valid_targets_min": 1135
},
{
"epoch": 2.86741214057508,
"grad_norm": 0.7055818423441181,
"learning_rate": 2.9433643455981874e-05,
"loss": 0.3988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39843347668647766,
"step": 1795,
"valid_targets_mean": 3255.6,
"valid_targets_min": 927
},
{
"epoch": 2.8753993610223643,
"grad_norm": 0.7843389401141818,
"learning_rate": 2.9363313702691827e-05,
"loss": 0.3622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41534000635147095,
"step": 1800,
"valid_targets_mean": 2498.8,
"valid_targets_min": 1019
},
{
"epoch": 2.8833865814696487,
"grad_norm": 0.6724104574364067,
"learning_rate": 2.9292835350636957e-05,
"loss": 0.4022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38030463457107544,
"step": 1805,
"valid_targets_mean": 3430.4,
"valid_targets_min": 1112
},
{
"epoch": 2.891373801916933,
"grad_norm": 0.5916718834917873,
"learning_rate": 2.922220951833111e-05,
"loss": 0.3808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31356799602508545,
"step": 1810,
"valid_targets_mean": 3772.6,
"valid_targets_min": 951
},
{
"epoch": 2.899361022364217,
"grad_norm": 0.7654937514668824,
"learning_rate": 2.9151437326628706e-05,
"loss": 0.3866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3887610137462616,
"step": 1815,
"valid_targets_mean": 2553.3,
"valid_targets_min": 936
},
{
"epoch": 2.9073482428115014,
"grad_norm": 0.7480115771607395,
"learning_rate": 2.908051989870692e-05,
"loss": 0.3894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3808180093765259,
"step": 1820,
"valid_targets_mean": 3117.8,
"valid_targets_min": 791
},
{
"epoch": 2.915335463258786,
"grad_norm": 0.7187356737229668,
"learning_rate": 2.9009458360047867e-05,
"loss": 0.3829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4151441752910614,
"step": 1825,
"valid_targets_mean": 2946.7,
"valid_targets_min": 1304
},
{
"epoch": 2.92332268370607,
"grad_norm": 0.6464747283506714,
"learning_rate": 2.8938253838420762e-05,
"loss": 0.3949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39368531107902527,
"step": 1830,
"valid_targets_mean": 3852.4,
"valid_targets_min": 875
},
{
"epoch": 2.9313099041533546,
"grad_norm": 0.7244350087292859,
"learning_rate": 2.8866907463864006e-05,
"loss": 0.378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3935213088989258,
"step": 1835,
"valid_targets_mean": 2723.6,
"valid_targets_min": 988
},
{
"epoch": 2.939297124600639,
"grad_norm": 0.6851586503030473,
"learning_rate": 2.8795420368667225e-05,
"loss": 0.3717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41738811135292053,
"step": 1840,
"valid_targets_mean": 3267.9,
"valid_targets_min": 924
},
{
"epoch": 2.9472843450479234,
"grad_norm": 0.6915563143903232,
"learning_rate": 2.8723793687353354e-05,
"loss": 0.3893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38308918476104736,
"step": 1845,
"valid_targets_mean": 3031.2,
"valid_targets_min": 974
},
{
"epoch": 2.9552715654952078,
"grad_norm": 0.6819090921664839,
"learning_rate": 2.8652028556660593e-05,
"loss": 0.4031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36406490206718445,
"step": 1850,
"valid_targets_mean": 3324.1,
"valid_targets_min": 1575
},
{
"epoch": 2.963258785942492,
"grad_norm": 0.7719683466940759,
"learning_rate": 2.8580126115524373e-05,
"loss": 0.3996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38270652294158936,
"step": 1855,
"valid_targets_mean": 2710.7,
"valid_targets_min": 1122
},
{
"epoch": 2.9712460063897765,
"grad_norm": 0.7584408057005778,
"learning_rate": 2.8508087505059302e-05,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40344762802124023,
"step": 1860,
"valid_targets_mean": 2602.8,
"valid_targets_min": 1057
},
{
"epoch": 2.979233226837061,
"grad_norm": 0.8095860463062092,
"learning_rate": 2.843591386854102e-05,
"loss": 0.3794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3777475953102112,
"step": 1865,
"valid_targets_mean": 2237.3,
"valid_targets_min": 1016
},
{
"epoch": 2.987220447284345,
"grad_norm": 0.8139871848333652,
"learning_rate": 2.8363606351388068e-05,
"loss": 0.4007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3748500943183899,
"step": 1870,
"valid_targets_mean": 2634.4,
"valid_targets_min": 981
},
{
"epoch": 2.9952076677316293,
"grad_norm": 0.6031621618600853,
"learning_rate": 2.829116610114375e-05,
"loss": 0.3663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.309096097946167,
"step": 1875,
"valid_targets_mean": 3321.8,
"valid_targets_min": 918
},
{
"epoch": 3.0031948881789137,
"grad_norm": 0.7010853523494205,
"learning_rate": 2.821859426745786e-05,
"loss": 0.377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3830505609512329,
"step": 1880,
"valid_targets_mean": 3283.0,
"valid_targets_min": 1103
},
{
"epoch": 3.011182108626198,
"grad_norm": 0.7997009121695763,
"learning_rate": 2.8145892002068454e-05,
"loss": 0.3306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33155494928359985,
"step": 1885,
"valid_targets_mean": 2721.9,
"valid_targets_min": 1253
},
{
"epoch": 3.0191693290734825,
"grad_norm": 0.880787133238318,
"learning_rate": 2.8073060458783606e-05,
"loss": 0.3252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31442296504974365,
"step": 1890,
"valid_targets_mean": 2083.6,
"valid_targets_min": 1019
},
{
"epoch": 3.027156549520767,
"grad_norm": 0.851278068434791,
"learning_rate": 2.8000100793463056e-05,
"loss": 0.3341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33716338872909546,
"step": 1895,
"valid_targets_mean": 2149.1,
"valid_targets_min": 971
},
{
"epoch": 3.0351437699680512,
"grad_norm": 0.7724207654837609,
"learning_rate": 2.792701416399988e-05,
"loss": 0.3567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37443485856056213,
"step": 1900,
"valid_targets_mean": 2977.1,
"valid_targets_min": 1171
},
{
"epoch": 3.0431309904153356,
"grad_norm": 0.8292296160816116,
"learning_rate": 2.7853801730302134e-05,
"loss": 0.3506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33334457874298096,
"step": 1905,
"valid_targets_mean": 2229.8,
"valid_targets_min": 1298
},
{
"epoch": 3.0511182108626196,
"grad_norm": 0.7738562965360346,
"learning_rate": 2.7780464654274396e-05,
"loss": 0.3521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34110739827156067,
"step": 1910,
"valid_targets_mean": 2591.9,
"valid_targets_min": 810
},
{
"epoch": 3.059105431309904,
"grad_norm": 0.7004842336637774,
"learning_rate": 2.770700409979938e-05,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2925085723400116,
"step": 1915,
"valid_targets_mean": 2646.9,
"valid_targets_min": 959
},
{
"epoch": 3.0670926517571884,
"grad_norm": 0.8088128682511053,
"learning_rate": 2.7633421232719442e-05,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3746018409729004,
"step": 1920,
"valid_targets_mean": 2762.9,
"valid_targets_min": 497
},
{
"epoch": 3.0750798722044728,
"grad_norm": 0.6921108063117793,
"learning_rate": 2.7559717220818067e-05,
"loss": 0.3419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33677250146865845,
"step": 1925,
"valid_targets_mean": 3465.4,
"valid_targets_min": 1438
},
{
"epoch": 3.083067092651757,
"grad_norm": 0.7792472115673951,
"learning_rate": 2.7485893233801366e-05,
"loss": 0.3499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3244081139564514,
"step": 1930,
"valid_targets_mean": 2584.4,
"valid_targets_min": 912
},
{
"epoch": 3.0910543130990416,
"grad_norm": 0.8282891276383806,
"learning_rate": 2.7411950443279458e-05,
"loss": 0.3555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3384396433830261,
"step": 1935,
"valid_targets_mean": 2538.3,
"valid_targets_min": 1040
},
{
"epoch": 3.099041533546326,
"grad_norm": 0.7315591962767853,
"learning_rate": 2.7337890022747945e-05,
"loss": 0.3468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32630831003189087,
"step": 1940,
"valid_targets_mean": 3223.4,
"valid_targets_min": 907
},
{
"epoch": 3.1070287539936103,
"grad_norm": 0.6369586602339742,
"learning_rate": 2.7263713147569243e-05,
"loss": 0.3601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34071576595306396,
"step": 1945,
"valid_targets_mean": 4314.2,
"valid_targets_min": 1241
},
{
"epoch": 3.1150159744408947,
"grad_norm": 0.7067109985051314,
"learning_rate": 2.7189420994953945e-05,
"loss": 0.3567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37993860244750977,
"step": 1950,
"valid_targets_mean": 3673.4,
"valid_targets_min": 1263
},
{
"epoch": 3.123003194888179,
"grad_norm": 0.8025979082829126,
"learning_rate": 2.7115014743942114e-05,
"loss": 0.3525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3262211084365845,
"step": 1955,
"valid_targets_mean": 2655.9,
"valid_targets_min": 1046
},
{
"epoch": 3.130990415335463,
"grad_norm": 0.6708281987337977,
"learning_rate": 2.704049557538461e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34278061985969543,
"step": 1960,
"valid_targets_mean": 3530.3,
"valid_targets_min": 1110
},
{
"epoch": 3.1389776357827475,
"grad_norm": 0.732176646472642,
"learning_rate": 2.696586467192434e-05,
"loss": 0.3438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36904671788215637,
"step": 1965,
"valid_targets_mean": 3570.9,
"valid_targets_min": 1321
},
{
"epoch": 3.146964856230032,
"grad_norm": 0.7557915517558162,
"learning_rate": 2.6891123217977448e-05,
"loss": 0.3468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3248704969882965,
"step": 1970,
"valid_targets_mean": 3341.5,
"valid_targets_min": 972
},
{
"epoch": 3.1549520766773163,
"grad_norm": 0.8328040999163244,
"learning_rate": 2.681627239971458e-05,
"loss": 0.355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33000561594963074,
"step": 1975,
"valid_targets_mean": 2162.9,
"valid_targets_min": 937
},
{
"epoch": 3.1629392971246006,
"grad_norm": 0.6796313251895518,
"learning_rate": 2.6741313405041997e-05,
"loss": 0.355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34723204374313354,
"step": 1980,
"valid_targets_mean": 3633.1,
"valid_targets_min": 1367
},
{
"epoch": 3.170926517571885,
"grad_norm": 0.6915824013782956,
"learning_rate": 2.666624742358279e-05,
"loss": 0.3424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2982881963253021,
"step": 1985,
"valid_targets_mean": 3259.9,
"valid_targets_min": 1035
},
{
"epoch": 3.1789137380191694,
"grad_norm": 0.8885716130967903,
"learning_rate": 2.659107564665794e-05,
"loss": 0.3507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38301947712898254,
"step": 1990,
"valid_targets_mean": 2289.6,
"valid_targets_min": 931
},
{
"epoch": 3.186900958466454,
"grad_norm": 0.7696659351010584,
"learning_rate": 2.6515799267267445e-05,
"loss": 0.3543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32373887300491333,
"step": 1995,
"valid_targets_mean": 2755.4,
"valid_targets_min": 1083
},
{
"epoch": 3.194888178913738,
"grad_norm": 0.666620619178921,
"learning_rate": 2.6440419480071366e-05,
"loss": 0.3542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33515575528144836,
"step": 2000,
"valid_targets_mean": 3775.8,
"valid_targets_min": 938
},
{
"epoch": 3.202875399361022,
"grad_norm": 0.8605815354678277,
"learning_rate": 2.6364937481370887e-05,
"loss": 0.3315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32717159390449524,
"step": 2005,
"valid_targets_mean": 1861.2,
"valid_targets_min": 848
},
{
"epoch": 3.2108626198083066,
"grad_norm": 0.8139366969767636,
"learning_rate": 2.628935446908933e-05,
"loss": 0.3432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3549983501434326,
"step": 2010,
"valid_targets_mean": 2780.7,
"valid_targets_min": 924
},
{
"epoch": 3.218849840255591,
"grad_norm": 0.6178267872235499,
"learning_rate": 2.6213671642753124e-05,
"loss": 0.3373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27505552768707275,
"step": 2015,
"valid_targets_mean": 3498.8,
"valid_targets_min": 901
},
{
"epoch": 3.2268370607028753,
"grad_norm": 0.7498197701531762,
"learning_rate": 2.6137890203472786e-05,
"loss": 0.3437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28516024351119995,
"step": 2020,
"valid_targets_mean": 2339.2,
"valid_targets_min": 1043
},
{
"epoch": 3.2348242811501597,
"grad_norm": 0.779750885550688,
"learning_rate": 2.606201135392383e-05,
"loss": 0.3565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32652050256729126,
"step": 2025,
"valid_targets_mean": 3031.4,
"valid_targets_min": 938
},
{
"epoch": 3.242811501597444,
"grad_norm": 0.8362104239003927,
"learning_rate": 2.5986036298327725e-05,
"loss": 0.3428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.320258229970932,
"step": 2030,
"valid_targets_mean": 2208.7,
"valid_targets_min": 1122
},
{
"epoch": 3.2507987220447285,
"grad_norm": 0.7593338041815918,
"learning_rate": 2.590996624243276e-05,
"loss": 0.3248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3281738758087158,
"step": 2035,
"valid_targets_mean": 2861.4,
"valid_targets_min": 1047
},
{
"epoch": 3.258785942492013,
"grad_norm": 0.738061021392302,
"learning_rate": 2.5833802393494897e-05,
"loss": 0.3491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37253719568252563,
"step": 2040,
"valid_targets_mean": 3137.3,
"valid_targets_min": 873
},
{
"epoch": 3.2667731629392973,
"grad_norm": 0.805662472760199,
"learning_rate": 2.5757545960258638e-05,
"loss": 0.3443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35318508744239807,
"step": 2045,
"valid_targets_mean": 2663.6,
"valid_targets_min": 927
},
{
"epoch": 3.2747603833865817,
"grad_norm": 0.874774468106856,
"learning_rate": 2.5681198152937804e-05,
"loss": 0.3528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42066410183906555,
"step": 2050,
"valid_targets_mean": 2673.9,
"valid_targets_min": 1028
},
{
"epoch": 3.2827476038338657,
"grad_norm": 0.9367992662401398,
"learning_rate": 2.5604760183196377e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3702118396759033,
"step": 2055,
"valid_targets_mean": 2392.5,
"valid_targets_min": 732
},
{
"epoch": 3.29073482428115,
"grad_norm": 0.7835028898995575,
"learning_rate": 2.5528233264129228e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34959307312965393,
"step": 2060,
"valid_targets_mean": 2777.4,
"valid_targets_min": 1040
},
{
"epoch": 3.2987220447284344,
"grad_norm": 0.8490015562097194,
"learning_rate": 2.54516186102429e-05,
"loss": 0.3585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37757542729377747,
"step": 2065,
"valid_targets_mean": 2506.2,
"valid_targets_min": 1072
},
{
"epoch": 3.306709265175719,
"grad_norm": 0.829876673769117,
"learning_rate": 2.5374917437436294e-05,
"loss": 0.3498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3559834957122803,
"step": 2070,
"valid_targets_mean": 2435.7,
"valid_targets_min": 1130
},
{
"epoch": 3.3146964856230032,
"grad_norm": 0.7782930862626647,
"learning_rate": 2.5298130962981403e-05,
"loss": 0.3308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32831066846847534,
"step": 2075,
"valid_targets_mean": 2370.1,
"valid_targets_min": 1399
},
{
"epoch": 3.3226837060702876,
"grad_norm": 0.6821850671644661,
"learning_rate": 2.5221260405503985e-05,
"loss": 0.3437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3372279405593872,
"step": 2080,
"valid_targets_mean": 3202.9,
"valid_targets_min": 1192
},
{
"epoch": 3.330670926517572,
"grad_norm": 0.706369945800584,
"learning_rate": 2.5144306984964225e-05,
"loss": 0.3448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3640979826450348,
"step": 2085,
"valid_targets_mean": 3496.9,
"valid_targets_min": 1220
},
{
"epoch": 3.3386581469648564,
"grad_norm": 0.6858521053933514,
"learning_rate": 2.5067271922637377e-05,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.354512482881546,
"step": 2090,
"valid_targets_mean": 3103.3,
"valid_targets_min": 842
},
{
"epoch": 3.3466453674121404,
"grad_norm": 0.7050974701444196,
"learning_rate": 2.499015644109435e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.340786337852478,
"step": 2095,
"valid_targets_mean": 3263.6,
"valid_targets_min": 1263
},
{
"epoch": 3.3546325878594248,
"grad_norm": 0.7792547408720658,
"learning_rate": 2.491296176418236e-05,
"loss": 0.3488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31993260979652405,
"step": 2100,
"valid_targets_mean": 2408.8,
"valid_targets_min": 861
},
{
"epoch": 3.362619808306709,
"grad_norm": 0.8472394542146415,
"learning_rate": 2.4835689117005472e-05,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3624585270881653,
"step": 2105,
"valid_targets_mean": 2521.1,
"valid_targets_min": 1138
},
{
"epoch": 3.3706070287539935,
"grad_norm": 0.685542276172253,
"learning_rate": 2.4758339725905152e-05,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39794886112213135,
"step": 2110,
"valid_targets_mean": 3648.8,
"valid_targets_min": 1537
},
{
"epoch": 3.378594249201278,
"grad_norm": 0.8289815185367049,
"learning_rate": 2.4680914818440823e-05,
"loss": 0.3427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3529765009880066,
"step": 2115,
"valid_targets_mean": 2447.1,
"valid_targets_min": 1186
},
{
"epoch": 3.3865814696485623,
"grad_norm": 0.79580361575995,
"learning_rate": 2.4603415623370387e-05,
"loss": 0.3688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3427412509918213,
"step": 2120,
"valid_targets_mean": 2492.4,
"valid_targets_min": 1044
},
{
"epoch": 3.3945686900958467,
"grad_norm": 0.9174018660679429,
"learning_rate": 2.4525843370630697e-05,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35740599036216736,
"step": 2125,
"valid_targets_mean": 2116.4,
"valid_targets_min": 743
},
{
"epoch": 3.402555910543131,
"grad_norm": 0.92058483539087,
"learning_rate": 2.4448199291318058e-05,
"loss": 0.3518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35286015272140503,
"step": 2130,
"valid_targets_mean": 2801.2,
"valid_targets_min": 871
},
{
"epoch": 3.4105431309904155,
"grad_norm": 0.786887928884236,
"learning_rate": 2.4370484617668707e-05,
"loss": 0.3635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33476051688194275,
"step": 2135,
"valid_targets_mean": 2596.9,
"valid_targets_min": 742
},
{
"epoch": 3.4185303514377,
"grad_norm": 0.7258313848476246,
"learning_rate": 2.4292700583039194e-05,
"loss": 0.3444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3154415786266327,
"step": 2140,
"valid_targets_mean": 3060.0,
"valid_targets_min": 1183
},
{
"epoch": 3.426517571884984,
"grad_norm": 0.8298449989955331,
"learning_rate": 2.4214848421886893e-05,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39987191557884216,
"step": 2145,
"valid_targets_mean": 2922.6,
"valid_targets_min": 708
},
{
"epoch": 3.4345047923322682,
"grad_norm": 0.8571042529668489,
"learning_rate": 2.4136929369750344e-05,
"loss": 0.3624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37515556812286377,
"step": 2150,
"valid_targets_mean": 2234.4,
"valid_targets_min": 763
},
{
"epoch": 3.4424920127795526,
"grad_norm": 0.69019555021873,
"learning_rate": 2.4058944663229672e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.341417133808136,
"step": 2155,
"valid_targets_mean": 3493.2,
"valid_targets_min": 1130
},
{
"epoch": 3.450479233226837,
"grad_norm": 0.7666734882023155,
"learning_rate": 2.398089553996696e-05,
"loss": 0.3254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3008880019187927,
"step": 2160,
"valid_targets_mean": 2677.6,
"valid_targets_min": 1190
},
{
"epoch": 3.4584664536741214,
"grad_norm": 0.7843770052937605,
"learning_rate": 2.3902783238626604e-05,
"loss": 0.3636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34043818712234497,
"step": 2165,
"valid_targets_mean": 2748.9,
"valid_targets_min": 782
},
{
"epoch": 3.466453674121406,
"grad_norm": 0.8052459554106886,
"learning_rate": 2.3824608998875652e-05,
"loss": 0.3413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3473026156425476,
"step": 2170,
"valid_targets_mean": 2772.2,
"valid_targets_min": 1174
},
{
"epoch": 3.47444089456869,
"grad_norm": 0.7451939406088447,
"learning_rate": 2.3746374061364138e-05,
"loss": 0.3258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29451632499694824,
"step": 2175,
"valid_targets_mean": 2728.6,
"valid_targets_min": 690
},
{
"epoch": 3.4824281150159746,
"grad_norm": 0.6512980105925289,
"learning_rate": 2.3668079667705404e-05,
"loss": 0.3495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34157970547676086,
"step": 2180,
"valid_targets_mean": 3575.4,
"valid_targets_min": 1726
},
{
"epoch": 3.4904153354632586,
"grad_norm": 0.7079499032301315,
"learning_rate": 2.3589727060456342e-05,
"loss": 0.3521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3626313805580139,
"step": 2185,
"valid_targets_mean": 3225.8,
"valid_targets_min": 1124
},
{
"epoch": 3.498402555910543,
"grad_norm": 0.7295675412562281,
"learning_rate": 2.3511317483097753e-05,
"loss": 0.325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3401775658130646,
"step": 2190,
"valid_targets_mean": 2835.4,
"valid_targets_min": 1325
},
{
"epoch": 3.5063897763578273,
"grad_norm": 0.6970730857646832,
"learning_rate": 2.3432852180014548e-05,
"loss": 0.3578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32114821672439575,
"step": 2195,
"valid_targets_mean": 3394.9,
"valid_targets_min": 871
},
{
"epoch": 3.5143769968051117,
"grad_norm": 0.7359279593183425,
"learning_rate": 2.3354332396476026e-05,
"loss": 0.3304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3173915445804596,
"step": 2200,
"valid_targets_mean": 2769.9,
"valid_targets_min": 817
},
{
"epoch": 3.522364217252396,
"grad_norm": 0.8670971142439949,
"learning_rate": 2.327575937861612e-05,
"loss": 0.3273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3821990489959717,
"step": 2205,
"valid_targets_mean": 2721.3,
"valid_targets_min": 1028
},
{
"epoch": 3.5303514376996805,
"grad_norm": 0.7495600483899891,
"learning_rate": 2.3197134373413595e-05,
"loss": 0.3565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3791123032569885,
"step": 2210,
"valid_targets_mean": 2959.6,
"valid_targets_min": 963
},
{
"epoch": 3.538338658146965,
"grad_norm": 0.7631701646338969,
"learning_rate": 2.3118458628672272e-05,
"loss": 0.345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33027756214141846,
"step": 2215,
"valid_targets_mean": 2739.8,
"valid_targets_min": 1139
},
{
"epoch": 3.5463258785942493,
"grad_norm": 0.7210960761349475,
"learning_rate": 2.3039733393001233e-05,
"loss": 0.3456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.314005970954895,
"step": 2220,
"valid_targets_mean": 3064.6,
"valid_targets_min": 1529
},
{
"epoch": 3.5543130990415337,
"grad_norm": 0.7300448411862375,
"learning_rate": 2.2960959915794998e-05,
"loss": 0.3464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3501545786857605,
"step": 2225,
"valid_targets_mean": 3272.5,
"valid_targets_min": 884
},
{
"epoch": 3.562300319488818,
"grad_norm": 0.7352570371980378,
"learning_rate": 2.2882139447213673e-05,
"loss": 0.3466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.367412269115448,
"step": 2230,
"valid_targets_mean": 2964.4,
"valid_targets_min": 1122
},
{
"epoch": 3.5702875399361025,
"grad_norm": 0.7266777124532515,
"learning_rate": 2.280327323816317e-05,
"loss": 0.372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3345056176185608,
"step": 2235,
"valid_targets_mean": 3415.9,
"valid_targets_min": 1112
},
{
"epoch": 3.5782747603833864,
"grad_norm": 0.7833280724460969,
"learning_rate": 2.2724362540275288e-05,
"loss": 0.3541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3198665380477905,
"step": 2240,
"valid_targets_mean": 2523.6,
"valid_targets_min": 723
},
{
"epoch": 3.586261980830671,
"grad_norm": 0.6515565530417812,
"learning_rate": 2.2645408605887882e-05,
"loss": 0.3673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3271835446357727,
"step": 2245,
"valid_targets_mean": 3502.6,
"valid_targets_min": 999
},
{
"epoch": 3.594249201277955,
"grad_norm": 0.7096257136610091,
"learning_rate": 2.2566412688025003e-05,
"loss": 0.3645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3631103038787842,
"step": 2250,
"valid_targets_mean": 3502.5,
"valid_targets_min": 1024
},
{
"epoch": 3.6022364217252396,
"grad_norm": 0.9151425698789424,
"learning_rate": 2.2487376040376958e-05,
"loss": 0.3735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37757572531700134,
"step": 2255,
"valid_targets_mean": 3347.0,
"valid_targets_min": 877
},
{
"epoch": 3.610223642172524,
"grad_norm": 0.7347384259209934,
"learning_rate": 2.240829991728048e-05,
"loss": 0.3417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34199997782707214,
"step": 2260,
"valid_targets_mean": 3051.1,
"valid_targets_min": 786
},
{
"epoch": 3.6182108626198084,
"grad_norm": 0.94549554675444,
"learning_rate": 2.2329185573698778e-05,
"loss": 0.3339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36203259229660034,
"step": 2265,
"valid_targets_mean": 2668.2,
"valid_targets_min": 811
},
{
"epoch": 3.626198083067093,
"grad_norm": 0.711777124378337,
"learning_rate": 2.225003426520163e-05,
"loss": 0.3563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34062519669532776,
"step": 2270,
"valid_targets_mean": 3257.0,
"valid_targets_min": 1230
},
{
"epoch": 3.6341853035143767,
"grad_norm": 0.8097999383376286,
"learning_rate": 2.2170847247945466e-05,
"loss": 0.3435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3180551528930664,
"step": 2275,
"valid_targets_mean": 2292.1,
"valid_targets_min": 1108
},
{
"epoch": 3.642172523961661,
"grad_norm": 0.7944952102142546,
"learning_rate": 2.209162577865342e-05,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3482610881328583,
"step": 2280,
"valid_targets_mean": 2589.2,
"valid_targets_min": 1683
},
{
"epoch": 3.6501597444089455,
"grad_norm": 0.8244274418365245,
"learning_rate": 2.201237111459539e-05,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3237827718257904,
"step": 2285,
"valid_targets_mean": 2413.6,
"valid_targets_min": 955
},
{
"epoch": 3.65814696485623,
"grad_norm": 0.8893899727490636,
"learning_rate": 2.193308451356809e-05,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3441276252269745,
"step": 2290,
"valid_targets_mean": 2140.9,
"valid_targets_min": 1085
},
{
"epoch": 3.6661341853035143,
"grad_norm": 0.7931807861635283,
"learning_rate": 2.1853767233875084e-05,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32396748661994934,
"step": 2295,
"valid_targets_mean": 2703.6,
"valid_targets_min": 1040
},
{
"epoch": 3.6741214057507987,
"grad_norm": 0.7323099605303646,
"learning_rate": 2.1774420534306812e-05,
"loss": 0.369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37023335695266724,
"step": 2300,
"valid_targets_mean": 3230.1,
"valid_targets_min": 847
},
{
"epoch": 3.682108626198083,
"grad_norm": 0.8215600687589895,
"learning_rate": 2.1695045674120615e-05,
"loss": 0.3269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3557538390159607,
"step": 2305,
"valid_targets_mean": 2377.7,
"valid_targets_min": 1184
},
{
"epoch": 3.6900958466453675,
"grad_norm": 0.8134770011066427,
"learning_rate": 2.1615643913020755e-05,
"loss": 0.3593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33311760425567627,
"step": 2310,
"valid_targets_mean": 2857.2,
"valid_targets_min": 1311
},
{
"epoch": 3.698083067092652,
"grad_norm": 0.812226985002325,
"learning_rate": 2.1536216511138423e-05,
"loss": 0.3628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3659121096134186,
"step": 2315,
"valid_targets_mean": 2604.5,
"valid_targets_min": 1130
},
{
"epoch": 3.7060702875399363,
"grad_norm": 0.8800310047756553,
"learning_rate": 2.145676472901174e-05,
"loss": 0.3534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3661636412143707,
"step": 2320,
"valid_targets_mean": 2165.9,
"valid_targets_min": 1010
},
{
"epoch": 3.7140575079872207,
"grad_norm": 0.7143058958135756,
"learning_rate": 2.1377289827565734e-05,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33318227529525757,
"step": 2325,
"valid_targets_mean": 3463.3,
"valid_targets_min": 1056
},
{
"epoch": 3.722044728434505,
"grad_norm": 0.7011841853877164,
"learning_rate": 2.129779306809236e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31508100032806396,
"step": 2330,
"valid_targets_mean": 2909.1,
"valid_targets_min": 876
},
{
"epoch": 3.730031948881789,
"grad_norm": 0.8357370303330102,
"learning_rate": 2.121827571223046e-05,
"loss": 0.3559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3638567328453064,
"step": 2335,
"valid_targets_mean": 2311.0,
"valid_targets_min": 747
},
{
"epoch": 3.7380191693290734,
"grad_norm": 0.8037478490130382,
"learning_rate": 2.113873902194575e-05,
"loss": 0.3573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37670642137527466,
"step": 2340,
"valid_targets_mean": 3250.2,
"valid_targets_min": 1181
},
{
"epoch": 3.746006389776358,
"grad_norm": 0.8700223589429951,
"learning_rate": 2.1059184259510786e-05,
"loss": 0.3657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.386318564414978,
"step": 2345,
"valid_targets_mean": 2267.0,
"valid_targets_min": 962
},
{
"epoch": 3.753993610223642,
"grad_norm": 0.7600210560294047,
"learning_rate": 2.0979612687484935e-05,
"loss": 0.3502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36681851744651794,
"step": 2350,
"valid_targets_mean": 2949.6,
"valid_targets_min": 1248
},
{
"epoch": 3.7619808306709266,
"grad_norm": 0.8561255238812737,
"learning_rate": 2.0900025568694334e-05,
"loss": 0.3649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4018840193748474,
"step": 2355,
"valid_targets_mean": 2649.2,
"valid_targets_min": 834
},
{
"epoch": 3.769968051118211,
"grad_norm": 0.7901922853076591,
"learning_rate": 2.082042416621187e-05,
"loss": 0.3481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3670767843723297,
"step": 2360,
"valid_targets_mean": 2619.1,
"valid_targets_min": 855
},
{
"epoch": 3.777955271565495,
"grad_norm": 0.7216134214426689,
"learning_rate": 2.0740809743337095e-05,
"loss": 0.3117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3147008419036865,
"step": 2365,
"valid_targets_mean": 2834.6,
"valid_targets_min": 917
},
{
"epoch": 3.7859424920127793,
"grad_norm": 0.7955391112654346,
"learning_rate": 2.0661183563576202e-05,
"loss": 0.3525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36277374625205994,
"step": 2370,
"valid_targets_mean": 2651.1,
"valid_targets_min": 988
},
{
"epoch": 3.7939297124600637,
"grad_norm": 0.772152693083288,
"learning_rate": 2.0581546890621986e-05,
"loss": 0.3435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33806949853897095,
"step": 2375,
"valid_targets_mean": 2821.8,
"valid_targets_min": 1116
},
{
"epoch": 3.801916932907348,
"grad_norm": 0.8085716379516211,
"learning_rate": 2.0501900988333755e-05,
"loss": 0.3453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3489188551902771,
"step": 2380,
"valid_targets_mean": 2745.3,
"valid_targets_min": 430
},
{
"epoch": 3.8099041533546325,
"grad_norm": 0.6954666725539379,
"learning_rate": 2.0422247120717304e-05,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3149593472480774,
"step": 2385,
"valid_targets_mean": 2903.2,
"valid_targets_min": 1232
},
{
"epoch": 3.817891373801917,
"grad_norm": 0.7492864017320584,
"learning_rate": 2.0342586551904824e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33550161123275757,
"step": 2390,
"valid_targets_mean": 2524.8,
"valid_targets_min": 1136
},
{
"epoch": 3.8258785942492013,
"grad_norm": 0.7379062354051015,
"learning_rate": 2.026292054613486e-05,
"loss": 0.3554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35174477100372314,
"step": 2395,
"valid_targets_mean": 3198.4,
"valid_targets_min": 1011
},
{
"epoch": 3.8338658146964857,
"grad_norm": 0.826138505521665,
"learning_rate": 2.0183250367732253e-05,
"loss": 0.3538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3427872061729431,
"step": 2400,
"valid_targets_mean": 2487.9,
"valid_targets_min": 904
},
{
"epoch": 3.84185303514377,
"grad_norm": 0.7229382012400196,
"learning_rate": 2.0103577281088065e-05,
"loss": 0.3653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3543205261230469,
"step": 2405,
"valid_targets_mean": 3393.3,
"valid_targets_min": 836
},
{
"epoch": 3.8498402555910545,
"grad_norm": 0.7250967838290785,
"learning_rate": 2.00239025506395e-05,
"loss": 0.3467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32540053129196167,
"step": 2410,
"valid_targets_mean": 3386.4,
"valid_targets_min": 1153
},
{
"epoch": 3.857827476038339,
"grad_norm": 0.8104290152544857,
"learning_rate": 1.9944227440849856e-05,
"loss": 0.3532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3654288053512573,
"step": 2415,
"valid_targets_mean": 2680.6,
"valid_targets_min": 1050
},
{
"epoch": 3.8658146964856233,
"grad_norm": 0.7592811553776619,
"learning_rate": 1.9864553216188454e-05,
"loss": 0.3425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3243311643600464,
"step": 2420,
"valid_targets_mean": 2721.1,
"valid_targets_min": 1003
},
{
"epoch": 3.873801916932907,
"grad_norm": 0.8600247524167637,
"learning_rate": 1.978488114111057e-05,
"loss": 0.3799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3664115369319916,
"step": 2425,
"valid_targets_mean": 2369.9,
"valid_targets_min": 897
},
{
"epoch": 3.8817891373801916,
"grad_norm": 0.9127949248834691,
"learning_rate": 1.970521248003735e-05,
"loss": 0.3522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3474576771259308,
"step": 2430,
"valid_targets_mean": 1944.6,
"valid_targets_min": 1207
},
{
"epoch": 3.889776357827476,
"grad_norm": 0.8067494948013632,
"learning_rate": 1.9625548497335783e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33465152978897095,
"step": 2435,
"valid_targets_mean": 2467.1,
"valid_targets_min": 927
},
{
"epoch": 3.8977635782747604,
"grad_norm": 0.880971732697506,
"learning_rate": 1.9545890457298592e-05,
"loss": 0.3521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.351280152797699,
"step": 2440,
"valid_targets_mean": 2193.3,
"valid_targets_min": 949
},
{
"epoch": 3.905750798722045,
"grad_norm": 0.8521094362994456,
"learning_rate": 1.9466239624124203e-05,
"loss": 0.3403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3590460419654846,
"step": 2445,
"valid_targets_mean": 2435.9,
"valid_targets_min": 1120
},
{
"epoch": 3.913738019169329,
"grad_norm": 0.868802266909435,
"learning_rate": 1.938659726189663e-05,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30706340074539185,
"step": 2450,
"valid_targets_mean": 2211.0,
"valid_targets_min": 857
},
{
"epoch": 3.9217252396166136,
"grad_norm": 0.8259636849763473,
"learning_rate": 1.9306964634565505e-05,
"loss": 0.327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3763893246650696,
"step": 2455,
"valid_targets_mean": 2577.2,
"valid_targets_min": 1141
},
{
"epoch": 3.9297124600638975,
"grad_norm": 0.8213105655209398,
"learning_rate": 1.9227343005925926e-05,
"loss": 0.3341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3701975345611572,
"step": 2460,
"valid_targets_mean": 2671.8,
"valid_targets_min": 1206
},
{
"epoch": 3.937699680511182,
"grad_norm": 0.7207468257354757,
"learning_rate": 1.914773363959845e-05,
"loss": 0.3547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3682279586791992,
"step": 2465,
"valid_targets_mean": 3327.1,
"valid_targets_min": 1211
},
{
"epoch": 3.9456869009584663,
"grad_norm": 0.7740903599176833,
"learning_rate": 1.906813779900903e-05,
"loss": 0.3399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3290952444076538,
"step": 2470,
"valid_targets_mean": 2429.8,
"valid_targets_min": 1173
},
{
"epoch": 3.9536741214057507,
"grad_norm": 0.6969816315594596,
"learning_rate": 1.8988556747368953e-05,
"loss": 0.3328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31143099069595337,
"step": 2475,
"valid_targets_mean": 3285.7,
"valid_targets_min": 901
},
{
"epoch": 3.961661341853035,
"grad_norm": 0.6900509589111553,
"learning_rate": 1.890899174765481e-05,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32233577966690063,
"step": 2480,
"valid_targets_mean": 3132.6,
"valid_targets_min": 1216
},
{
"epoch": 3.9696485623003195,
"grad_norm": 0.7531324107571046,
"learning_rate": 1.8829444062588433e-05,
"loss": 0.3376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3661973476409912,
"step": 2485,
"valid_targets_mean": 2683.5,
"valid_targets_min": 722
},
{
"epoch": 3.977635782747604,
"grad_norm": 0.8859610638059474,
"learning_rate": 1.8749914954616882e-05,
"loss": 0.3484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39797261357307434,
"step": 2490,
"valid_targets_mean": 2247.5,
"valid_targets_min": 920
},
{
"epoch": 3.9856230031948883,
"grad_norm": 0.727951884939237,
"learning_rate": 1.867040568589236e-05,
"loss": 0.352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31643036007881165,
"step": 2495,
"valid_targets_mean": 3139.8,
"valid_targets_min": 733
},
{
"epoch": 3.9936102236421727,
"grad_norm": 0.7051175961125331,
"learning_rate": 1.859091751825225e-05,
"loss": 0.345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31299465894699097,
"step": 2500,
"valid_targets_mean": 2929.7,
"valid_targets_min": 1181
},
{
"epoch": 4.001597444089457,
"grad_norm": 0.7836980808537842,
"learning_rate": 1.8511451713199038e-05,
"loss": 0.337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.320000022649765,
"step": 2505,
"valid_targets_mean": 2379.3,
"valid_targets_min": 803
},
{
"epoch": 4.0095846645367414,
"grad_norm": 0.7784914545094099,
"learning_rate": 1.843200953188031e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2952941060066223,
"step": 2510,
"valid_targets_mean": 3074.2,
"valid_targets_min": 1215
},
{
"epoch": 4.017571884984026,
"grad_norm": 0.7642112879241275,
"learning_rate": 1.8352592235068735e-05,
"loss": 0.3158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2828487157821655,
"step": 2515,
"valid_targets_mean": 2811.1,
"valid_targets_min": 1026
},
{
"epoch": 4.02555910543131,
"grad_norm": 0.8934842633384591,
"learning_rate": 1.8273201083142056e-05,
"loss": 0.3116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3350905179977417,
"step": 2520,
"valid_targets_mean": 2196.1,
"valid_targets_min": 1139
},
{
"epoch": 4.033546325878595,
"grad_norm": 0.8830460996681451,
"learning_rate": 1.8193837336063096e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3144967257976532,
"step": 2525,
"valid_targets_mean": 2362.4,
"valid_targets_min": 829
},
{
"epoch": 4.041533546325879,
"grad_norm": 0.7589694170525213,
"learning_rate": 1.8114502253359745e-05,
"loss": 0.3235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.329261839389801,
"step": 2530,
"valid_targets_mean": 3463.7,
"valid_targets_min": 1162
},
{
"epoch": 4.0495207667731625,
"grad_norm": 2.6987601954147147,
"learning_rate": 1.8035197094104986e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3215765357017517,
"step": 2535,
"valid_targets_mean": 3010.8,
"valid_targets_min": 1144
},
{
"epoch": 4.057507987220447,
"grad_norm": 0.8913192131103218,
"learning_rate": 1.7955923116896908e-05,
"loss": 0.344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34397605061531067,
"step": 2540,
"valid_targets_mean": 2805.3,
"valid_targets_min": 916
},
{
"epoch": 4.065495207667731,
"grad_norm": 0.7455487784175526,
"learning_rate": 1.787668157983872e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35729163885116577,
"step": 2545,
"valid_targets_mean": 3363.3,
"valid_targets_min": 1378
},
{
"epoch": 4.073482428115016,
"grad_norm": 0.7873618036052649,
"learning_rate": 1.779747374051881e-05,
"loss": 0.3232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31921112537384033,
"step": 2550,
"valid_targets_mean": 3040.9,
"valid_targets_min": 1310
},
{
"epoch": 4.0814696485623,
"grad_norm": 0.7841123654379275,
"learning_rate": 1.7718300855990767e-05,
"loss": 0.3238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30261629819869995,
"step": 2555,
"valid_targets_mean": 2832.1,
"valid_targets_min": 1085
},
{
"epoch": 4.0894568690095845,
"grad_norm": 0.8354232619995942,
"learning_rate": 1.7639164182753434e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2939416170120239,
"step": 2560,
"valid_targets_mean": 2348.6,
"valid_targets_min": 851
},
{
"epoch": 4.097444089456869,
"grad_norm": 0.8279010105207609,
"learning_rate": 1.7560064976730967e-05,
"loss": 0.3311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2960469722747803,
"step": 2565,
"valid_targets_mean": 2403.9,
"valid_targets_min": 1514
},
{
"epoch": 4.105431309904153,
"grad_norm": 0.7720855666104548,
"learning_rate": 1.7481004493252915e-05,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29527148604393005,
"step": 2570,
"valid_targets_mean": 3140.0,
"valid_targets_min": 1130
},
{
"epoch": 4.113418530351438,
"grad_norm": 0.8561385263509396,
"learning_rate": 1.740198398703428e-05,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3038601875305176,
"step": 2575,
"valid_targets_mean": 2381.4,
"valid_targets_min": 1130
},
{
"epoch": 4.121405750798722,
"grad_norm": 0.732786585841618,
"learning_rate": 1.7323004712155613e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31189507246017456,
"step": 2580,
"valid_targets_mean": 3734.1,
"valid_targets_min": 1187
},
{
"epoch": 4.1293929712460065,
"grad_norm": 0.7953181249120669,
"learning_rate": 1.724406792204312e-05,
"loss": 0.3195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3025287389755249,
"step": 2585,
"valid_targets_mean": 2656.2,
"valid_targets_min": 1215
},
{
"epoch": 4.137380191693291,
"grad_norm": 0.7744633063634144,
"learning_rate": 1.7165174869448738e-05,
"loss": 0.3083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2929438650608063,
"step": 2590,
"valid_targets_mean": 2507.7,
"valid_targets_min": 1224
},
{
"epoch": 4.145367412140575,
"grad_norm": 0.7745147678616877,
"learning_rate": 1.7086326806430298e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.304587721824646,
"step": 2595,
"valid_targets_mean": 2938.4,
"valid_targets_min": 1284
},
{
"epoch": 4.15335463258786,
"grad_norm": 0.8991912650145979,
"learning_rate": 1.7007524984331623e-05,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32008877396583557,
"step": 2600,
"valid_targets_mean": 2276.9,
"valid_targets_min": 988
},
{
"epoch": 4.161341853035144,
"grad_norm": 0.8738895750174318,
"learning_rate": 1.692877065376268e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30264782905578613,
"step": 2605,
"valid_targets_mean": 2370.2,
"valid_targets_min": 971
},
{
"epoch": 4.169329073482428,
"grad_norm": 0.8046516983143223,
"learning_rate": 1.6850065064579724e-05,
"loss": 0.319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3758092522621155,
"step": 2610,
"valid_targets_mean": 2888.1,
"valid_targets_min": 1101
},
{
"epoch": 4.177316293929713,
"grad_norm": 0.7816553623092369,
"learning_rate": 1.677140946586548e-05,
"loss": 0.315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3018527328968048,
"step": 2615,
"valid_targets_mean": 3292.1,
"valid_targets_min": 823
},
{
"epoch": 4.185303514376997,
"grad_norm": 0.7701069701455311,
"learning_rate": 1.66928051059093e-05,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29624032974243164,
"step": 2620,
"valid_targets_mean": 3122.0,
"valid_targets_min": 1020
},
{
"epoch": 4.193290734824281,
"grad_norm": 0.8468234652278214,
"learning_rate": 1.6614253232187363e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3546920120716095,
"step": 2625,
"valid_targets_mean": 3006.4,
"valid_targets_min": 985
},
{
"epoch": 4.201277955271565,
"grad_norm": 0.7804812824667207,
"learning_rate": 1.6535755091342876e-05,
"loss": 0.318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2810975909233093,
"step": 2630,
"valid_targets_mean": 3003.0,
"valid_targets_min": 1330
},
{
"epoch": 4.2092651757188495,
"grad_norm": 0.8314006980762537,
"learning_rate": 1.6457311929166286e-05,
"loss": 0.3308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3335530161857605,
"step": 2635,
"valid_targets_mean": 2748.6,
"valid_targets_min": 797
},
{
"epoch": 4.217252396166134,
"grad_norm": 1.2682211032574355,
"learning_rate": 1.637892499057551e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32898035645484924,
"step": 2640,
"valid_targets_mean": 2015.6,
"valid_targets_min": 1038
},
{
"epoch": 4.225239616613418,
"grad_norm": 0.6756060081334775,
"learning_rate": 1.6300595519596177e-05,
"loss": 0.3214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3469483256340027,
"step": 2645,
"valid_targets_mean": 4125.4,
"valid_targets_min": 906
},
{
"epoch": 4.233226837060703,
"grad_norm": 0.830457676846521,
"learning_rate": 1.6222324759341897e-05,
"loss": 0.318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.372150182723999,
"step": 2650,
"valid_targets_mean": 2774.6,
"valid_targets_min": 978
},
{
"epoch": 4.241214057507987,
"grad_norm": 0.8301772168189655,
"learning_rate": 1.6144113951994515e-05,
"loss": 0.3055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3426179885864258,
"step": 2655,
"valid_targets_mean": 2936.2,
"valid_targets_min": 1189
},
{
"epoch": 4.2492012779552715,
"grad_norm": 0.7442017453136883,
"learning_rate": 1.60659643387844e-05,
"loss": 0.3342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32107579708099365,
"step": 2660,
"valid_targets_mean": 3388.4,
"valid_targets_min": 929
},
{
"epoch": 4.257188498402556,
"grad_norm": 0.7989995875352693,
"learning_rate": 1.5987877159970765e-05,
"loss": 0.3218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3555402457714081,
"step": 2665,
"valid_targets_mean": 2872.1,
"valid_targets_min": 1153
},
{
"epoch": 4.26517571884984,
"grad_norm": 0.9194992318413938,
"learning_rate": 1.5909853654821947e-05,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34973281621932983,
"step": 2670,
"valid_targets_mean": 2280.6,
"valid_targets_min": 837
},
{
"epoch": 4.273162939297125,
"grad_norm": 0.7793815135340966,
"learning_rate": 1.583189506159579e-05,
"loss": 0.3272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32121002674102783,
"step": 2675,
"valid_targets_mean": 3233.8,
"valid_targets_min": 1172
},
{
"epoch": 4.281150159744409,
"grad_norm": 0.7419814536244536,
"learning_rate": 1.575400261751993e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26411211490631104,
"step": 2680,
"valid_targets_mean": 2861.4,
"valid_targets_min": 888
},
{
"epoch": 4.289137380191693,
"grad_norm": 0.8190096841902706,
"learning_rate": 1.567617755877223e-05,
"loss": 0.3196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31602364778518677,
"step": 2685,
"valid_targets_mean": 3839.0,
"valid_targets_min": 737
},
{
"epoch": 4.297124600638978,
"grad_norm": 0.8513254156626134,
"learning_rate": 1.5598421120461106e-05,
"loss": 0.324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34726378321647644,
"step": 2690,
"valid_targets_mean": 3125.2,
"valid_targets_min": 1159
},
{
"epoch": 4.305111821086262,
"grad_norm": 0.8742879239076529,
"learning_rate": 1.552073453660595e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2954450249671936,
"step": 2695,
"valid_targets_mean": 2049.4,
"valid_targets_min": 1043
},
{
"epoch": 4.313099041533547,
"grad_norm": 0.8803976612275924,
"learning_rate": 1.5443119040117544e-05,
"loss": 0.3157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31700998544692993,
"step": 2700,
"valid_targets_mean": 2607.2,
"valid_targets_min": 1532
},
{
"epoch": 4.321086261980831,
"grad_norm": 0.7893323019925185,
"learning_rate": 1.536557586277849e-05,
"loss": 0.3269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3041345477104187,
"step": 2705,
"valid_targets_mean": 3251.6,
"valid_targets_min": 1152
},
{
"epoch": 4.329073482428115,
"grad_norm": 0.8702685258904816,
"learning_rate": 1.5288106235223655e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3005998730659485,
"step": 2710,
"valid_targets_mean": 2477.4,
"valid_targets_min": 853
},
{
"epoch": 4.3370607028754,
"grad_norm": 0.6841522781915828,
"learning_rate": 1.521071138692066e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31260186433792114,
"step": 2715,
"valid_targets_mean": 3646.8,
"valid_targets_min": 1019
},
{
"epoch": 4.345047923322683,
"grad_norm": 0.8793770134129358,
"learning_rate": 1.5133392546150347e-05,
"loss": 0.3292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3228303790092468,
"step": 2720,
"valid_targets_mean": 2257.6,
"valid_targets_min": 1119
},
{
"epoch": 4.353035143769968,
"grad_norm": 0.7356041781956482,
"learning_rate": 1.5056150939987303e-05,
"loss": 0.3233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2978741526603699,
"step": 2725,
"valid_targets_mean": 3256.1,
"valid_targets_min": 1130
},
{
"epoch": 4.361022364217252,
"grad_norm": 0.8575488601782734,
"learning_rate": 1.4978987794280363e-05,
"loss": 0.338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3490545153617859,
"step": 2730,
"valid_targets_mean": 2729.2,
"valid_targets_min": 651
},
{
"epoch": 4.3690095846645365,
"grad_norm": 0.8487291733521595,
"learning_rate": 1.4901904333633179e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3031385540962219,
"step": 2735,
"valid_targets_mean": 2487.4,
"valid_targets_min": 969
},
{
"epoch": 4.376996805111821,
"grad_norm": 0.822564579116967,
"learning_rate": 1.4824901781384777e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2881549894809723,
"step": 2740,
"valid_targets_mean": 2674.9,
"valid_targets_min": 876
},
{
"epoch": 4.384984025559105,
"grad_norm": 0.869337603970582,
"learning_rate": 1.4747981359590138e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3272026777267456,
"step": 2745,
"valid_targets_mean": 2358.8,
"valid_targets_min": 1083
},
{
"epoch": 4.39297124600639,
"grad_norm": 0.8621433957032326,
"learning_rate": 1.4671144289000806e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3270319104194641,
"step": 2750,
"valid_targets_mean": 2623.6,
"valid_targets_min": 1187
},
{
"epoch": 4.400958466453674,
"grad_norm": 0.7737153035103758,
"learning_rate": 1.4594391789045513e-05,
"loss": 0.3145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3190346360206604,
"step": 2755,
"valid_targets_mean": 2979.1,
"valid_targets_min": 957
},
{
"epoch": 4.4089456869009584,
"grad_norm": 0.7196118582656776,
"learning_rate": 1.4517725077810835e-05,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2696632146835327,
"step": 2760,
"valid_targets_mean": 3125.1,
"valid_targets_min": 1003
},
{
"epoch": 4.416932907348243,
"grad_norm": 0.6494097240205376,
"learning_rate": 1.4441145372021847e-05,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3023773431777954,
"step": 2765,
"valid_targets_mean": 3835.9,
"valid_targets_min": 1076
},
{
"epoch": 4.424920127795527,
"grad_norm": 0.7789314639253977,
"learning_rate": 1.4364653887022831e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32076117396354675,
"step": 2770,
"valid_targets_mean": 2887.3,
"valid_targets_min": 849
},
{
"epoch": 4.432907348242812,
"grad_norm": 0.8479733674287858,
"learning_rate": 1.4288251836757956e-05,
"loss": 0.3279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31372612714767456,
"step": 2775,
"valid_targets_mean": 2776.1,
"valid_targets_min": 1171
},
{
"epoch": 4.440894568690096,
"grad_norm": 0.7510027085556208,
"learning_rate": 1.4211940433752052e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3128352165222168,
"step": 2780,
"valid_targets_mean": 3347.7,
"valid_targets_min": 1018
},
{
"epoch": 4.44888178913738,
"grad_norm": 1.0678801727890188,
"learning_rate": 1.4135720889091342e-05,
"loss": 0.3116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33587950468063354,
"step": 2785,
"valid_targets_mean": 2601.2,
"valid_targets_min": 1071
},
{
"epoch": 4.456869009584665,
"grad_norm": 0.7024654713140126,
"learning_rate": 1.4059594412404227e-05,
"loss": 0.3257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28195154666900635,
"step": 2790,
"valid_targets_mean": 3657.8,
"valid_targets_min": 1431
},
{
"epoch": 4.464856230031949,
"grad_norm": 0.7937537911917101,
"learning_rate": 1.3983562211842094e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30999305844306946,
"step": 2795,
"valid_targets_mean": 3226.8,
"valid_targets_min": 1176
},
{
"epoch": 4.472843450479234,
"grad_norm": 0.8150515310476798,
"learning_rate": 1.390762549406013e-05,
"loss": 0.3078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33410537242889404,
"step": 2800,
"valid_targets_mean": 2873.4,
"valid_targets_min": 983
},
{
"epoch": 4.480830670926517,
"grad_norm": 0.7481249885495977,
"learning_rate": 1.3831785464198188e-05,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3242833912372589,
"step": 2805,
"valid_targets_mean": 3249.0,
"valid_targets_min": 924
},
{
"epoch": 4.488817891373802,
"grad_norm": 0.8863393546681068,
"learning_rate": 1.3756043325861648e-05,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30686694383621216,
"step": 2810,
"valid_targets_mean": 2602.9,
"valid_targets_min": 1229
},
{
"epoch": 4.496805111821086,
"grad_norm": 0.8894834385161677,
"learning_rate": 1.3680400281102326e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2976420521736145,
"step": 2815,
"valid_targets_mean": 2074.1,
"valid_targets_min": 1041
},
{
"epoch": 4.50479233226837,
"grad_norm": 0.9310689795086521,
"learning_rate": 1.3604857530399378e-05,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40471312403678894,
"step": 2820,
"valid_targets_mean": 2295.2,
"valid_targets_min": 430
},
{
"epoch": 4.512779552715655,
"grad_norm": 0.7523089341040629,
"learning_rate": 1.3529416272640278e-05,
"loss": 0.325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2931872308254242,
"step": 2825,
"valid_targets_mean": 2772.8,
"valid_targets_min": 1438
},
{
"epoch": 4.520766773162939,
"grad_norm": 0.8964434235440402,
"learning_rate": 1.3454077705101766e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35491257905960083,
"step": 2830,
"valid_targets_mean": 2291.6,
"valid_targets_min": 857
},
{
"epoch": 4.5287539936102235,
"grad_norm": 0.7823384694721772,
"learning_rate": 1.3378843023430856e-05,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3356529772281647,
"step": 2835,
"valid_targets_mean": 3122.6,
"valid_targets_min": 1283
},
{
"epoch": 4.536741214057508,
"grad_norm": 0.8162940884992557,
"learning_rate": 1.3303713421625864e-05,
"loss": 0.3014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30902934074401855,
"step": 2840,
"valid_targets_mean": 2529.6,
"valid_targets_min": 992
},
{
"epoch": 4.544728434504792,
"grad_norm": 0.7970840712086852,
"learning_rate": 1.3228690092017452e-05,
"loss": 0.3078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29649817943573,
"step": 2845,
"valid_targets_mean": 2565.8,
"valid_targets_min": 1298
},
{
"epoch": 4.552715654952077,
"grad_norm": 0.8158566717200522,
"learning_rate": 1.3153774225249705e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33489930629730225,
"step": 2850,
"valid_targets_mean": 2931.1,
"valid_targets_min": 1587
},
{
"epoch": 4.560702875399361,
"grad_norm": 0.9705943358780271,
"learning_rate": 1.3078967010261243e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36530590057373047,
"step": 2855,
"valid_targets_mean": 2347.4,
"valid_targets_min": 659
},
{
"epoch": 4.568690095846645,
"grad_norm": 0.867288807597881,
"learning_rate": 1.3004269634266357e-05,
"loss": 0.3355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3266403079032898,
"step": 2860,
"valid_targets_mean": 2646.6,
"valid_targets_min": 864
},
{
"epoch": 4.57667731629393,
"grad_norm": 0.85633385349373,
"learning_rate": 1.2929683282736135e-05,
"loss": 0.309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31155091524124146,
"step": 2865,
"valid_targets_mean": 2291.2,
"valid_targets_min": 1044
},
{
"epoch": 4.584664536741214,
"grad_norm": 0.8733957612598485,
"learning_rate": 1.285520913937969e-05,
"loss": 0.3373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3596514165401459,
"step": 2870,
"valid_targets_mean": 2465.4,
"valid_targets_min": 697
},
{
"epoch": 4.592651757188499,
"grad_norm": 0.8439557548254832,
"learning_rate": 1.2780848386125354e-05,
"loss": 0.341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3084920644760132,
"step": 2875,
"valid_targets_mean": 2439.3,
"valid_targets_min": 1096
},
{
"epoch": 4.600638977635783,
"grad_norm": 0.7574914303418859,
"learning_rate": 1.2706602203101913e-05,
"loss": 0.3158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2827756404876709,
"step": 2880,
"valid_targets_mean": 2762.9,
"valid_targets_min": 860
},
{
"epoch": 4.608626198083067,
"grad_norm": 0.8187552779251025,
"learning_rate": 1.2632471768619894e-05,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3288748860359192,
"step": 2885,
"valid_targets_mean": 2768.2,
"valid_targets_min": 1053
},
{
"epoch": 4.616613418530352,
"grad_norm": 0.7875128783332611,
"learning_rate": 1.255845825915286e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29355835914611816,
"step": 2890,
"valid_targets_mean": 2613.6,
"valid_targets_min": 1075
},
{
"epoch": 4.624600638977636,
"grad_norm": 0.8034781377355279,
"learning_rate": 1.248456284931873e-05,
"loss": 0.3117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3028643727302551,
"step": 2895,
"valid_targets_mean": 2869.2,
"valid_targets_min": 1386
},
{
"epoch": 4.63258785942492,
"grad_norm": 0.7962900798710767,
"learning_rate": 1.241078671186115e-05,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.346049040555954,
"step": 2900,
"valid_targets_mean": 2883.4,
"valid_targets_min": 1294
},
{
"epoch": 4.640575079872205,
"grad_norm": 0.8023873273428883,
"learning_rate": 1.2337131017630873e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3004358410835266,
"step": 2905,
"valid_targets_mean": 2556.7,
"valid_targets_min": 891
},
{
"epoch": 4.6485623003194885,
"grad_norm": 0.8977806884389504,
"learning_rate": 1.2263596935567175e-05,
"loss": 0.3213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32839423418045044,
"step": 2910,
"valid_targets_mean": 3472.2,
"valid_targets_min": 1178
},
{
"epoch": 4.656549520766773,
"grad_norm": 0.7106582489525565,
"learning_rate": 1.2190185632679316e-05,
"loss": 0.3118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2885178327560425,
"step": 2915,
"valid_targets_mean": 3290.6,
"valid_targets_min": 912
},
{
"epoch": 4.664536741214057,
"grad_norm": 0.667191215845006,
"learning_rate": 1.2116898274028008e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2748382091522217,
"step": 2920,
"valid_targets_mean": 4097.6,
"valid_targets_min": 1180
},
{
"epoch": 4.672523961661342,
"grad_norm": 0.8255323403479464,
"learning_rate": 1.2043736022706934e-05,
"loss": 0.3245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34103143215179443,
"step": 2925,
"valid_targets_mean": 2534.6,
"valid_targets_min": 1061
},
{
"epoch": 4.680511182108626,
"grad_norm": 1.0630168206337054,
"learning_rate": 1.1970700039824271e-05,
"loss": 0.3399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3425711989402771,
"step": 2930,
"valid_targets_mean": 2254.5,
"valid_targets_min": 742
},
{
"epoch": 4.68849840255591,
"grad_norm": 0.8323979797486944,
"learning_rate": 1.1897791484484284e-05,
"loss": 0.3184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31606024503707886,
"step": 2935,
"valid_targets_mean": 2571.6,
"valid_targets_min": 747
},
{
"epoch": 4.696485623003195,
"grad_norm": 0.7798233457306829,
"learning_rate": 1.182501151376893e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2969059944152832,
"step": 2940,
"valid_targets_mean": 2631.4,
"valid_targets_min": 1289
},
{
"epoch": 4.704472843450479,
"grad_norm": 0.717355278192079,
"learning_rate": 1.1752361282719472e-05,
"loss": 0.3141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2805374264717102,
"step": 2945,
"valid_targets_mean": 3219.2,
"valid_targets_min": 1478
},
{
"epoch": 4.712460063897764,
"grad_norm": 0.8644521598904813,
"learning_rate": 1.1679841944318171e-05,
"loss": 0.3269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.317280113697052,
"step": 2950,
"valid_targets_mean": 2483.1,
"valid_targets_min": 927
},
{
"epoch": 4.720447284345048,
"grad_norm": 0.8645726435153137,
"learning_rate": 1.1607454649469991e-05,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2650579810142517,
"step": 2955,
"valid_targets_mean": 2288.5,
"valid_targets_min": 869
},
{
"epoch": 4.728434504792332,
"grad_norm": 0.7976688949944475,
"learning_rate": 1.1535200546984291e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30540648102760315,
"step": 2960,
"valid_targets_mean": 2663.8,
"valid_targets_min": 1342
},
{
"epoch": 4.736421725239617,
"grad_norm": 0.8664261433843101,
"learning_rate": 1.1463080783556663e-05,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3349177837371826,
"step": 2965,
"valid_targets_mean": 2668.2,
"valid_targets_min": 1079
},
{
"epoch": 4.744408945686901,
"grad_norm": 0.7406641800839713,
"learning_rate": 1.139109650375066e-05,
"loss": 0.3318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3015572130680084,
"step": 2970,
"valid_targets_mean": 3056.8,
"valid_targets_min": 1715
},
{
"epoch": 4.752396166134186,
"grad_norm": 0.857312699295414,
"learning_rate": 1.1319248849979705e-05,
"loss": 0.3126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35463592410087585,
"step": 2975,
"valid_targets_mean": 3039.2,
"valid_targets_min": 1433
},
{
"epoch": 4.76038338658147,
"grad_norm": 0.8450913381311652,
"learning_rate": 1.1247538962488882e-05,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3202403783798218,
"step": 2980,
"valid_targets_mean": 2744.7,
"valid_targets_min": 901
},
{
"epoch": 4.768370607028754,
"grad_norm": 0.7830697313162523,
"learning_rate": 1.1175967979336913e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3308242857456207,
"step": 2985,
"valid_targets_mean": 3116.3,
"valid_targets_min": 1017
},
{
"epoch": 4.776357827476039,
"grad_norm": 0.7830125935395612,
"learning_rate": 1.1104537036378054e-05,
"loss": 0.3144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3096255660057068,
"step": 2990,
"valid_targets_mean": 3076.9,
"valid_targets_min": 1036
},
{
"epoch": 4.784345047923322,
"grad_norm": 0.8355403682431177,
"learning_rate": 1.1033247267244063e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30156558752059937,
"step": 2995,
"valid_targets_mean": 2738.4,
"valid_targets_min": 1026
},
{
"epoch": 4.792332268370607,
"grad_norm": 0.7250424081419844,
"learning_rate": 1.0962099803326257e-05,
"loss": 0.313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28947603702545166,
"step": 3000,
"valid_targets_mean": 3327.1,
"valid_targets_min": 931
},
{
"epoch": 4.800319488817891,
"grad_norm": 0.9386381305034504,
"learning_rate": 1.089109577375748e-05,
"loss": 0.321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33451300859451294,
"step": 3005,
"valid_targets_mean": 1926.2,
"valid_targets_min": 949
},
{
"epoch": 4.8083067092651754,
"grad_norm": 0.9607923151156983,
"learning_rate": 1.082023630539427e-05,
"loss": 0.3235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3341418504714966,
"step": 3010,
"valid_targets_mean": 2006.8,
"valid_targets_min": 944
},
{
"epoch": 4.81629392971246,
"grad_norm": 0.8329571872141134,
"learning_rate": 1.07495225227989e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35894811153411865,
"step": 3015,
"valid_targets_mean": 2908.5,
"valid_targets_min": 887
},
{
"epoch": 4.824281150159744,
"grad_norm": 0.8370383236843801,
"learning_rate": 1.0678955548221595e-05,
"loss": 0.3333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3370824456214905,
"step": 3020,
"valid_targets_mean": 2618.8,
"valid_targets_min": 1134
},
{
"epoch": 4.832268370607029,
"grad_norm": 0.9448990709923799,
"learning_rate": 1.0608536501582654e-05,
"loss": 0.3193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34659168124198914,
"step": 3025,
"valid_targets_mean": 2263.4,
"valid_targets_min": 1230
},
{
"epoch": 4.840255591054313,
"grad_norm": 0.8223141685878618,
"learning_rate": 1.0538266500454739e-05,
"loss": 0.3247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35333919525146484,
"step": 3030,
"valid_targets_mean": 3194.6,
"valid_targets_min": 960
},
{
"epoch": 4.848242811501597,
"grad_norm": 0.8144903161010786,
"learning_rate": 1.0468146660045118e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2987595498561859,
"step": 3035,
"valid_targets_mean": 2810.4,
"valid_targets_min": 681
},
{
"epoch": 4.856230031948882,
"grad_norm": 0.9075766431749717,
"learning_rate": 1.0398178093177928e-05,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3274604380130768,
"step": 3040,
"valid_targets_mean": 2483.5,
"valid_targets_min": 948
},
{
"epoch": 4.864217252396166,
"grad_norm": 0.7273114917343588,
"learning_rate": 1.0328361910276592e-05,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3381314277648926,
"step": 3045,
"valid_targets_mean": 3621.1,
"valid_targets_min": 1769
},
{
"epoch": 4.872204472843451,
"grad_norm": 0.7820761358000989,
"learning_rate": 1.0258699219346091e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27850645780563354,
"step": 3050,
"valid_targets_mean": 3137.2,
"valid_targets_min": 1036
},
{
"epoch": 4.880191693290735,
"grad_norm": 0.8361404113450691,
"learning_rate": 1.0189191125955503e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.328288197517395,
"step": 3055,
"valid_targets_mean": 2804.3,
"valid_targets_min": 1316
},
{
"epoch": 4.888178913738019,
"grad_norm": 0.8866370829805829,
"learning_rate": 1.0119838733220342e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30976438522338867,
"step": 3060,
"valid_targets_mean": 2255.0,
"valid_targets_min": 1081
},
{
"epoch": 4.896166134185304,
"grad_norm": 0.7548674340256988,
"learning_rate": 1.0050643141785148e-05,
"loss": 0.323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.296387642621994,
"step": 3065,
"valid_targets_mean": 2844.9,
"valid_targets_min": 1408
},
{
"epoch": 4.904153354632588,
"grad_norm": 0.8332532662745489,
"learning_rate": 9.981605449805933e-06,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2925332188606262,
"step": 3070,
"valid_targets_mean": 2291.7,
"valid_targets_min": 1238
},
{
"epoch": 4.912140575079873,
"grad_norm": 0.8598926872352152,
"learning_rate": 9.912726752932823e-06,
"loss": 0.3198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32179611921310425,
"step": 3075,
"valid_targets_mean": 2410.4,
"valid_targets_min": 1110
},
{
"epoch": 4.920127795527156,
"grad_norm": 0.7424748231440373,
"learning_rate": 9.844008144292643e-06,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29315125942230225,
"step": 3080,
"valid_targets_mean": 3143.2,
"valid_targets_min": 1075
},
{
"epoch": 4.928115015974441,
"grad_norm": 0.9235518733511646,
"learning_rate": 9.775450714471537e-06,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3396497070789337,
"step": 3085,
"valid_targets_mean": 2151.2,
"valid_targets_min": 972
},
{
"epoch": 4.936102236421725,
"grad_norm": 0.6816211371601565,
"learning_rate": 9.707055551497734e-06,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29893457889556885,
"step": 3090,
"valid_targets_mean": 3611.6,
"valid_targets_min": 1289
},
{
"epoch": 4.944089456869009,
"grad_norm": 0.8170219219392088,
"learning_rate": 9.638823740824177e-06,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2988799214363098,
"step": 3095,
"valid_targets_mean": 2490.7,
"valid_targets_min": 1019
},
{
"epoch": 4.952076677316294,
"grad_norm": 0.7458396020996966,
"learning_rate": 9.570756365311418e-06,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32337093353271484,
"step": 3100,
"valid_targets_mean": 3530.2,
"valid_targets_min": 1258
},
{
"epoch": 4.960063897763578,
"grad_norm": 0.7455812050660711,
"learning_rate": 9.502854505210326e-06,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3213096857070923,
"step": 3105,
"valid_targets_mean": 2728.7,
"valid_targets_min": 1108
},
{
"epoch": 4.968051118210862,
"grad_norm": 0.7843594515963668,
"learning_rate": 9.435119238145018e-06,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3219505548477173,
"step": 3110,
"valid_targets_mean": 3162.7,
"valid_targets_min": 357
},
{
"epoch": 4.976038338658147,
"grad_norm": 0.7656830597494546,
"learning_rate": 9.367551639095704e-06,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33506011962890625,
"step": 3115,
"valid_targets_mean": 3141.4,
"valid_targets_min": 1192
},
{
"epoch": 4.984025559105431,
"grad_norm": 0.9724543109745135,
"learning_rate": 9.300152780381664e-06,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3792024254798889,
"step": 3120,
"valid_targets_mean": 2552.1,
"valid_targets_min": 875
},
{
"epoch": 4.992012779552716,
"grad_norm": 0.748363011262852,
"learning_rate": 9.232923731644216e-06,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2932063043117523,
"step": 3125,
"valid_targets_mean": 3223.9,
"valid_targets_min": 1187
},
{
"epoch": 5.0,
"grad_norm": 0.7872370648886844,
"learning_rate": 9.16586555982972e-06,
"loss": 0.2881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28079310059547424,
"step": 3130,
"valid_targets_mean": 2799.1,
"valid_targets_min": 1113
},
{
"epoch": 5.007987220447284,
"grad_norm": 0.7939193129172704,
"learning_rate": 9.098979329172702e-06,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27301716804504395,
"step": 3135,
"valid_targets_mean": 2498.5,
"valid_targets_min": 732
},
{
"epoch": 5.015974440894569,
"grad_norm": 0.8161794104869049,
"learning_rate": 9.032266101178872e-06,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30852165818214417,
"step": 3140,
"valid_targets_mean": 2731.8,
"valid_targets_min": 857
},
{
"epoch": 5.023961661341853,
"grad_norm": 0.9254348282198132,
"learning_rate": 8.965726934608392e-06,
"loss": 0.2954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2905504107475281,
"step": 3145,
"valid_targets_mean": 2591.9,
"valid_targets_min": 913
},
{
"epoch": 5.031948881789138,
"grad_norm": 0.6971325615014937,
"learning_rate": 8.899362885458964e-06,
"loss": 0.3092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28469550609588623,
"step": 3150,
"valid_targets_mean": 3842.1,
"valid_targets_min": 990
},
{
"epoch": 5.039936102236422,
"grad_norm": 0.8228394781114576,
"learning_rate": 8.833175006949165e-06,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2873718738555908,
"step": 3155,
"valid_targets_mean": 2796.2,
"valid_targets_min": 690
},
{
"epoch": 5.047923322683706,
"grad_norm": 0.7756264018207162,
"learning_rate": 8.767164349501648e-06,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2786628305912018,
"step": 3160,
"valid_targets_mean": 3256.9,
"valid_targets_min": 1270
},
{
"epoch": 5.055910543130991,
"grad_norm": 0.9177797446364668,
"learning_rate": 8.70133196072654e-06,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31999728083610535,
"step": 3165,
"valid_targets_mean": 2434.4,
"valid_targets_min": 1327
},
{
"epoch": 5.063897763578275,
"grad_norm": 0.8631163026077268,
"learning_rate": 8.63567888540478e-06,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3382035493850708,
"step": 3170,
"valid_targets_mean": 2910.9,
"valid_targets_min": 1067
},
{
"epoch": 5.0718849840255595,
"grad_norm": 0.8946157821444155,
"learning_rate": 8.570206165471535e-06,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2751600742340088,
"step": 3175,
"valid_targets_mean": 2490.8,
"valid_targets_min": 755
},
{
"epoch": 5.079872204472843,
"grad_norm": 0.8297010600531302,
"learning_rate": 8.504914839999691e-06,
"loss": 0.2823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27816468477249146,
"step": 3180,
"valid_targets_mean": 2886.9,
"valid_targets_min": 1381
},
{
"epoch": 5.087859424920127,
"grad_norm": 0.8507115440982196,
"learning_rate": 8.439805945183333e-06,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2772366404533386,
"step": 3185,
"valid_targets_mean": 2524.4,
"valid_targets_min": 852
},
{
"epoch": 5.095846645367412,
"grad_norm": 0.807103384546817,
"learning_rate": 8.374880514321318e-06,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27188539505004883,
"step": 3190,
"valid_targets_mean": 2683.4,
"valid_targets_min": 1022
},
{
"epoch": 5.103833865814696,
"grad_norm": 1.7728666178247663,
"learning_rate": 8.310139577800864e-06,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3083685636520386,
"step": 3195,
"valid_targets_mean": 3117.4,
"valid_targets_min": 1083
},
{
"epoch": 5.111821086261981,
"grad_norm": 0.8170861054810535,
"learning_rate": 8.245584163081228e-06,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28269141912460327,
"step": 3200,
"valid_targets_mean": 3077.5,
"valid_targets_min": 1317
},
{
"epoch": 5.119808306709265,
"grad_norm": 0.9004835635106335,
"learning_rate": 8.18121529467735e-06,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3067591190338135,
"step": 3205,
"valid_targets_mean": 3360.2,
"valid_targets_min": 1502
},
{
"epoch": 5.127795527156549,
"grad_norm": 0.7289161691303735,
"learning_rate": 8.117033994143635e-06,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.269919216632843,
"step": 3210,
"valid_targets_mean": 3433.9,
"valid_targets_min": 1040
},
{
"epoch": 5.135782747603834,
"grad_norm": 0.8262371961557731,
"learning_rate": 8.053041280057733e-06,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30624669790267944,
"step": 3215,
"valid_targets_mean": 3221.0,
"valid_targets_min": 1568
},
{
"epoch": 5.143769968051118,
"grad_norm": 0.8907753230016606,
"learning_rate": 7.989238168004347e-06,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29566720128059387,
"step": 3220,
"valid_targets_mean": 2364.5,
"valid_targets_min": 964
},
{
"epoch": 5.151757188498403,
"grad_norm": 0.7773585981365254,
"learning_rate": 7.925625670559158e-06,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3160741925239563,
"step": 3225,
"valid_targets_mean": 3290.5,
"valid_targets_min": 816
},
{
"epoch": 5.159744408945687,
"grad_norm": 0.798268114199115,
"learning_rate": 7.862204797272716e-06,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2718545198440552,
"step": 3230,
"valid_targets_mean": 3023.7,
"valid_targets_min": 357
},
{
"epoch": 5.167731629392971,
"grad_norm": 0.8348325476127518,
"learning_rate": 7.798976554654438e-06,
"loss": 0.3014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30119389295578003,
"step": 3235,
"valid_targets_mean": 2845.3,
"valid_targets_min": 1075
},
{
"epoch": 5.175718849840256,
"grad_norm": 0.8607243588387653,
"learning_rate": 7.73594194615663e-06,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3085380494594574,
"step": 3240,
"valid_targets_mean": 3279.1,
"valid_targets_min": 1584
},
{
"epoch": 5.18370607028754,
"grad_norm": 0.8423375550417697,
"learning_rate": 7.673101972158572e-06,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27567416429519653,
"step": 3245,
"valid_targets_mean": 3083.5,
"valid_targets_min": 1024
},
{
"epoch": 5.1916932907348246,
"grad_norm": 0.852032784496535,
"learning_rate": 7.610457629950621e-06,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31364840269088745,
"step": 3250,
"valid_targets_mean": 2934.4,
"valid_targets_min": 812
},
{
"epoch": 5.199680511182109,
"grad_norm": 0.893030105220023,
"learning_rate": 7.548009913718402e-06,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30386775732040405,
"step": 3255,
"valid_targets_mean": 2715.1,
"valid_targets_min": 876
},
{
"epoch": 5.207667731629393,
"grad_norm": 0.8002908602580624,
"learning_rate": 7.485759814527034e-06,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22816193103790283,
"step": 3260,
"valid_targets_mean": 2609.4,
"valid_targets_min": 873
},
{
"epoch": 5.215654952076678,
"grad_norm": 0.8435557857370886,
"learning_rate": 7.423708320305361e-06,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3217226564884186,
"step": 3265,
"valid_targets_mean": 3110.6,
"valid_targets_min": 958
},
{
"epoch": 5.223642172523961,
"grad_norm": 0.8017066205902743,
"learning_rate": 7.361856415830335e-06,
"loss": 0.3095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31609028577804565,
"step": 3270,
"valid_targets_mean": 3048.7,
"valid_targets_min": 1242
},
{
"epoch": 5.231629392971246,
"grad_norm": 0.7893657441141547,
"learning_rate": 7.300205082711336e-06,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28325214982032776,
"step": 3275,
"valid_targets_mean": 2750.2,
"valid_targets_min": 949
},
{
"epoch": 5.23961661341853,
"grad_norm": 0.819627997431354,
"learning_rate": 7.2387552993746204e-06,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3147261440753937,
"step": 3280,
"valid_targets_mean": 3124.6,
"valid_targets_min": 1264
},
{
"epoch": 5.247603833865814,
"grad_norm": 0.9351538022500683,
"learning_rate": 7.177508041047769e-06,
"loss": 0.289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2968599200248718,
"step": 3285,
"valid_targets_mean": 2553.6,
"valid_targets_min": 815
},
{
"epoch": 5.255591054313099,
"grad_norm": 0.7977468970245414,
"learning_rate": 7.116464279744262e-06,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29074782133102417,
"step": 3290,
"valid_targets_mean": 3356.4,
"valid_targets_min": 877
},
{
"epoch": 5.263578274760383,
"grad_norm": 1.0002932413081114,
"learning_rate": 7.055624984247977e-06,
"loss": 0.3092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29408007860183716,
"step": 3295,
"valid_targets_mean": 2184.9,
"valid_targets_min": 861
},
{
"epoch": 5.271565495207668,
"grad_norm": 0.8787187369922238,
"learning_rate": 6.9949911200978805e-06,
"loss": 0.3088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3129739463329315,
"step": 3300,
"valid_targets_mean": 2784.6,
"valid_targets_min": 1331
},
{
"epoch": 5.279552715654952,
"grad_norm": 0.7688302677974961,
"learning_rate": 6.934563649572678e-06,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3016201853752136,
"step": 3305,
"valid_targets_mean": 3469.8,
"valid_targets_min": 974
},
{
"epoch": 5.287539936102236,
"grad_norm": 0.9959524806904558,
"learning_rate": 6.874343531675521e-06,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28774166107177734,
"step": 3310,
"valid_targets_mean": 2686.1,
"valid_targets_min": 1122
},
{
"epoch": 5.295527156549521,
"grad_norm": 0.7733058351207257,
"learning_rate": 6.814331722118837e-06,
"loss": 0.2782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26841095089912415,
"step": 3315,
"valid_targets_mean": 3147.9,
"valid_targets_min": 970
},
{
"epoch": 5.303514376996805,
"grad_norm": 0.9011760987645664,
"learning_rate": 6.754529173309112e-06,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30054977536201477,
"step": 3320,
"valid_targets_mean": 3109.7,
"valid_targets_min": 1123
},
{
"epoch": 5.31150159744409,
"grad_norm": 0.9298325145703232,
"learning_rate": 6.694936834331809e-06,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3050529956817627,
"step": 3325,
"valid_targets_mean": 2623.0,
"valid_targets_min": 1197
},
{
"epoch": 5.319488817891374,
"grad_norm": 1.064260914169855,
"learning_rate": 6.635555650936278e-06,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2775145173072815,
"step": 3330,
"valid_targets_mean": 2871.4,
"valid_targets_min": 962
},
{
"epoch": 5.327476038338658,
"grad_norm": 1.0158736615306445,
"learning_rate": 6.576386565520794e-06,
"loss": 0.2873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29485511779785156,
"step": 3335,
"valid_targets_mean": 2650.2,
"valid_targets_min": 918
},
{
"epoch": 5.335463258785943,
"grad_norm": 0.870400658138986,
"learning_rate": 6.5174305171175336e-06,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30564117431640625,
"step": 3340,
"valid_targets_mean": 2673.1,
"valid_targets_min": 944
},
{
"epoch": 5.343450479233227,
"grad_norm": 0.9219545531854473,
"learning_rate": 6.458688441377734e-06,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3267873227596283,
"step": 3345,
"valid_targets_mean": 2452.8,
"valid_targets_min": 1007
},
{
"epoch": 5.3514376996805115,
"grad_norm": 0.8548078329069492,
"learning_rate": 6.400161270556817e-06,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32129526138305664,
"step": 3350,
"valid_targets_mean": 2940.7,
"valid_targets_min": 1154
},
{
"epoch": 5.359424920127796,
"grad_norm": 0.8829397660322249,
"learning_rate": 6.341849933499573e-06,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3029319941997528,
"step": 3355,
"valid_targets_mean": 2987.6,
"valid_targets_min": 1235
},
{
"epoch": 5.36741214057508,
"grad_norm": 0.8530974806686331,
"learning_rate": 6.283755355625472e-06,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2870420217514038,
"step": 3360,
"valid_targets_mean": 2990.7,
"valid_targets_min": 1015
},
{
"epoch": 5.375399361022364,
"grad_norm": 0.9145905408930249,
"learning_rate": 6.225878458913917e-06,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2793818414211273,
"step": 3365,
"valid_targets_mean": 2471.1,
"valid_targets_min": 1095
},
{
"epoch": 5.383386581469648,
"grad_norm": 0.8855698711753888,
"learning_rate": 6.168220161889678e-06,
"loss": 0.2978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34292152523994446,
"step": 3370,
"valid_targets_mean": 2997.3,
"valid_targets_min": 1237
},
{
"epoch": 5.391373801916933,
"grad_norm": 0.7349516509123469,
"learning_rate": 6.110781379608226e-06,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25433140993118286,
"step": 3375,
"valid_targets_mean": 3235.3,
"valid_targets_min": 1040
},
{
"epoch": 5.399361022364217,
"grad_norm": 1.0542744110852993,
"learning_rate": 6.053563023641318e-06,
"loss": 0.3057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38673511147499084,
"step": 3380,
"valid_targets_mean": 2352.1,
"valid_targets_min": 1110
},
{
"epoch": 5.407348242811501,
"grad_norm": 0.827121547272794,
"learning_rate": 5.996566002062439e-06,
"loss": 0.2978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31490558385849,
"step": 3385,
"valid_targets_mean": 2948.4,
"valid_targets_min": 1442
},
{
"epoch": 5.415335463258786,
"grad_norm": 0.8460018479986304,
"learning_rate": 5.939791219432442e-06,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29256829619407654,
"step": 3390,
"valid_targets_mean": 3162.4,
"valid_targets_min": 1461
},
{
"epoch": 5.42332268370607,
"grad_norm": 0.8344660862038872,
"learning_rate": 5.8832395767851846e-06,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2993561923503876,
"step": 3395,
"valid_targets_mean": 2604.9,
"valid_targets_min": 1357
},
{
"epoch": 5.431309904153355,
"grad_norm": 0.9435119676368734,
"learning_rate": 5.826911971613198e-06,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911856174468994,
"step": 3400,
"valid_targets_mean": 2483.8,
"valid_targets_min": 849
},
{
"epoch": 5.439297124600639,
"grad_norm": 0.8098232349422515,
"learning_rate": 5.770809297853495e-06,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26919856667518616,
"step": 3405,
"valid_targets_mean": 2917.8,
"valid_targets_min": 960
},
{
"epoch": 5.447284345047923,
"grad_norm": 0.862605956589078,
"learning_rate": 5.714932445873325e-06,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27299582958221436,
"step": 3410,
"valid_targets_mean": 2560.8,
"valid_targets_min": 1041
},
{
"epoch": 5.455271565495208,
"grad_norm": 0.9020710803465632,
"learning_rate": 5.659282302456115e-06,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.282878577709198,
"step": 3415,
"valid_targets_mean": 2509.6,
"valid_targets_min": 1406
},
{
"epoch": 5.463258785942492,
"grad_norm": 0.8669441953326755,
"learning_rate": 5.603859750787302e-06,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26606321334838867,
"step": 3420,
"valid_targets_mean": 2598.4,
"valid_targets_min": 936
},
{
"epoch": 5.4712460063897765,
"grad_norm": 0.8752038102537848,
"learning_rate": 5.548665670440418e-06,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2888076603412628,
"step": 3425,
"valid_targets_mean": 2626.9,
"valid_targets_min": 1683
},
{
"epoch": 5.479233226837061,
"grad_norm": 0.8483698839811887,
"learning_rate": 5.4937009373630535e-06,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2613609731197357,
"step": 3430,
"valid_targets_mean": 2517.3,
"valid_targets_min": 1131
},
{
"epoch": 5.487220447284345,
"grad_norm": 0.8034035667215341,
"learning_rate": 5.438966423862997e-06,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2635997533798218,
"step": 3435,
"valid_targets_mean": 3017.4,
"valid_targets_min": 1019
},
{
"epoch": 5.49520766773163,
"grad_norm": 0.8066653273398859,
"learning_rate": 5.384462998594384e-06,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26338884234428406,
"step": 3440,
"valid_targets_mean": 2630.4,
"valid_targets_min": 1079
},
{
"epoch": 5.503194888178914,
"grad_norm": 0.8323232685505498,
"learning_rate": 5.330191526543884e-06,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.288205087184906,
"step": 3445,
"valid_targets_mean": 2767.9,
"valid_targets_min": 1243
},
{
"epoch": 5.511182108626198,
"grad_norm": 1.046868167441267,
"learning_rate": 5.276152869017028e-06,
"loss": 0.3088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35603612661361694,
"step": 3450,
"valid_targets_mean": 2214.9,
"valid_targets_min": 1039
},
{
"epoch": 5.519169329073483,
"grad_norm": 0.8670390164428484,
"learning_rate": 5.22234788362447e-06,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28677263855934143,
"step": 3455,
"valid_targets_mean": 2610.7,
"valid_targets_min": 923
},
{
"epoch": 5.527156549520766,
"grad_norm": 0.953868413472568,
"learning_rate": 5.168777424268454e-06,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34387460350990295,
"step": 3460,
"valid_targets_mean": 2308.2,
"valid_targets_min": 1232
},
{
"epoch": 5.535143769968051,
"grad_norm": 0.8022290889230155,
"learning_rate": 5.115442341129171e-06,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.288701593875885,
"step": 3465,
"valid_targets_mean": 3129.0,
"valid_targets_min": 870
},
{
"epoch": 5.543130990415335,
"grad_norm": 0.8115409043956004,
"learning_rate": 5.062343480651364e-06,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29845625162124634,
"step": 3470,
"valid_targets_mean": 2757.8,
"valid_targets_min": 876
},
{
"epoch": 5.55111821086262,
"grad_norm": 0.7835197890738079,
"learning_rate": 5.009481685530817e-06,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28913915157318115,
"step": 3475,
"valid_targets_mean": 3522.1,
"valid_targets_min": 1068
},
{
"epoch": 5.559105431309904,
"grad_norm": 0.7660079313726896,
"learning_rate": 4.956857794701026e-06,
"loss": 0.2807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2907702624797821,
"step": 3480,
"valid_targets_mean": 3248.2,
"valid_targets_min": 1035
},
{
"epoch": 5.567092651757188,
"grad_norm": 0.8170731714868842,
"learning_rate": 4.904472643319873e-06,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2342405468225479,
"step": 3485,
"valid_targets_mean": 2918.7,
"valid_targets_min": 967
},
{
"epoch": 5.575079872204473,
"grad_norm": 0.8514738656541708,
"learning_rate": 4.852327062756352e-06,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2788478136062622,
"step": 3490,
"valid_targets_mean": 2642.8,
"valid_targets_min": 1083
},
{
"epoch": 5.583067092651757,
"grad_norm": 0.9142924446585464,
"learning_rate": 4.800421880577411e-06,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2819330096244812,
"step": 3495,
"valid_targets_mean": 2215.6,
"valid_targets_min": 970
},
{
"epoch": 5.5910543130990416,
"grad_norm": 0.8351131614292047,
"learning_rate": 4.748757920534779e-06,
"loss": 0.3139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3117348551750183,
"step": 3500,
"valid_targets_mean": 2887.9,
"valid_targets_min": 1066
},
{
"epoch": 5.599041533546326,
"grad_norm": 0.878780990253628,
"learning_rate": 4.697336002551947e-06,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30660977959632874,
"step": 3505,
"valid_targets_mean": 2960.4,
"valid_targets_min": 1047
},
{
"epoch": 5.60702875399361,
"grad_norm": 0.9550316046064914,
"learning_rate": 4.6461569427110684e-06,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2975427508354187,
"step": 3510,
"valid_targets_mean": 2113.9,
"valid_targets_min": 1039
},
{
"epoch": 5.615015974440895,
"grad_norm": 0.8614684885214283,
"learning_rate": 4.5952215532401146e-06,
"loss": 0.2796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2506102919578552,
"step": 3515,
"valid_targets_mean": 3007.6,
"valid_targets_min": 1284
},
{
"epoch": 5.623003194888179,
"grad_norm": 0.7055162824372356,
"learning_rate": 4.544530642499894e-06,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2834452688694,
"step": 3520,
"valid_targets_mean": 3786.9,
"valid_targets_min": 1342
},
{
"epoch": 5.6309904153354635,
"grad_norm": 0.9327473225687424,
"learning_rate": 4.4940850149712765e-06,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2986459732055664,
"step": 3525,
"valid_targets_mean": 2386.1,
"valid_targets_min": 1204
},
{
"epoch": 5.638977635782748,
"grad_norm": 0.8782006771428341,
"learning_rate": 4.443885471242418e-06,
"loss": 0.3132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31005507707595825,
"step": 3530,
"valid_targets_mean": 2924.8,
"valid_targets_min": 640
},
{
"epoch": 5.646964856230032,
"grad_norm": 0.9010177674718335,
"learning_rate": 4.393932807996017e-06,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31273573637008667,
"step": 3535,
"valid_targets_mean": 3174.8,
"valid_targets_min": 998
},
{
"epoch": 5.654952076677317,
"grad_norm": 0.9330314923606065,
"learning_rate": 4.344227817996735e-06,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2842142581939697,
"step": 3540,
"valid_targets_mean": 2522.3,
"valid_targets_min": 1245
},
{
"epoch": 5.6629392971246,
"grad_norm": 0.8724285443483777,
"learning_rate": 4.294771290078548e-06,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26506611704826355,
"step": 3545,
"valid_targets_mean": 3159.2,
"valid_targets_min": 1330
},
{
"epoch": 5.6709265175718855,
"grad_norm": 0.8540186381544715,
"learning_rate": 4.245564009132293e-06,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3010174036026001,
"step": 3550,
"valid_targets_mean": 2621.1,
"valid_targets_min": 947
},
{
"epoch": 5.678913738019169,
"grad_norm": 0.8410560464629185,
"learning_rate": 4.196606756093138e-06,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27265846729278564,
"step": 3555,
"valid_targets_mean": 2626.9,
"valid_targets_min": 981
},
{
"epoch": 5.686900958466453,
"grad_norm": 0.8063270462445804,
"learning_rate": 4.147900307928268e-06,
"loss": 0.2856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.302957147359848,
"step": 3560,
"valid_targets_mean": 3118.4,
"valid_targets_min": 883
},
{
"epoch": 5.694888178913738,
"grad_norm": 0.8910767531567404,
"learning_rate": 4.099445437624487e-06,
"loss": 0.2975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2881123125553131,
"step": 3565,
"valid_targets_mean": 2818.1,
"valid_targets_min": 1050
},
{
"epoch": 5.702875399361022,
"grad_norm": 0.9644419826076724,
"learning_rate": 4.051242914175995e-06,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3191588819026947,
"step": 3570,
"valid_targets_mean": 2307.6,
"valid_targets_min": 1330
},
{
"epoch": 5.710862619808307,
"grad_norm": 0.8825281014957341,
"learning_rate": 4.003293502572163e-06,
"loss": 0.3041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2749369144439697,
"step": 3575,
"valid_targets_mean": 2434.3,
"valid_targets_min": 924
},
{
"epoch": 5.718849840255591,
"grad_norm": 0.8149662345511066,
"learning_rate": 3.955597963785391e-06,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30972984433174133,
"step": 3580,
"valid_targets_mean": 3602.3,
"valid_targets_min": 1235
},
{
"epoch": 5.726837060702875,
"grad_norm": 0.8208308645247685,
"learning_rate": 3.908157054759048e-06,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33973070979118347,
"step": 3585,
"valid_targets_mean": 3309.0,
"valid_targets_min": 1474
},
{
"epoch": 5.73482428115016,
"grad_norm": 1.2817350246441914,
"learning_rate": 3.860971528395427e-06,
"loss": 0.2985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.281210720539093,
"step": 3590,
"valid_targets_mean": 3072.1,
"valid_targets_min": 1051
},
{
"epoch": 5.742811501597444,
"grad_norm": 0.858260521624848,
"learning_rate": 3.814042133543847e-06,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29261261224746704,
"step": 3595,
"valid_targets_mean": 2800.6,
"valid_targets_min": 1520
},
{
"epoch": 5.7507987220447285,
"grad_norm": 0.8620084879239728,
"learning_rate": 3.7673696149887117e-06,
"loss": 0.2848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29667365550994873,
"step": 3600,
"valid_targets_mean": 2740.4,
"valid_targets_min": 1116
},
{
"epoch": 5.758785942492013,
"grad_norm": 0.8265698068500232,
"learning_rate": 3.72095471343773e-06,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3263239562511444,
"step": 3605,
"valid_targets_mean": 3160.9,
"valid_targets_min": 1162
},
{
"epoch": 5.766773162939297,
"grad_norm": 0.9027943191349252,
"learning_rate": 3.674798165510136e-06,
"loss": 0.3065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34345391392707825,
"step": 3610,
"valid_targets_mean": 3071.5,
"valid_targets_min": 888
},
{
"epoch": 5.774760383386582,
"grad_norm": 0.836591157500133,
"learning_rate": 3.6289007037250244e-06,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26754382252693176,
"step": 3615,
"valid_targets_mean": 2665.3,
"valid_targets_min": 1085
},
{
"epoch": 5.782747603833866,
"grad_norm": 0.9145676011202615,
"learning_rate": 3.5832630564897073e-06,
"loss": 0.3092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32892486453056335,
"step": 3620,
"valid_targets_mean": 2602.9,
"valid_targets_min": 769
},
{
"epoch": 5.7907348242811505,
"grad_norm": 0.7629854921736774,
"learning_rate": 3.5378859480881443e-06,
"loss": 0.2731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24377216398715973,
"step": 3625,
"valid_targets_mean": 3199.8,
"valid_targets_min": 811
},
{
"epoch": 5.798722044728435,
"grad_norm": 0.8042286264919823,
"learning_rate": 3.492770098669478e-06,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911136746406555,
"step": 3630,
"valid_targets_mean": 3393.9,
"valid_targets_min": 1265
},
{
"epoch": 5.806709265175719,
"grad_norm": 0.8369688623613801,
"learning_rate": 3.4479162242365717e-06,
"loss": 0.269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27095547318458557,
"step": 3635,
"valid_targets_mean": 2753.4,
"valid_targets_min": 1154
},
{
"epoch": 5.814696485623003,
"grad_norm": 0.8947818480367905,
"learning_rate": 3.403325036634679e-06,
"loss": 0.2848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27299612760543823,
"step": 3640,
"valid_targets_mean": 2596.2,
"valid_targets_min": 1244
},
{
"epoch": 5.822683706070287,
"grad_norm": 0.8775169850347424,
"learning_rate": 3.3589972435401184e-06,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2821030616760254,
"step": 3645,
"valid_targets_mean": 2154.2,
"valid_targets_min": 927
},
{
"epoch": 5.830670926517572,
"grad_norm": 0.9187215143961998,
"learning_rate": 3.3149335484490553e-06,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30498552322387695,
"step": 3650,
"valid_targets_mean": 2995.2,
"valid_targets_min": 1031
},
{
"epoch": 5.838658146964856,
"grad_norm": 0.7319498337703215,
"learning_rate": 3.2711346506663346e-06,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28768712282180786,
"step": 3655,
"valid_targets_mean": 3588.6,
"valid_targets_min": 2002
},
{
"epoch": 5.84664536741214,
"grad_norm": 0.8297441398475794,
"learning_rate": 3.2276012452943893e-06,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2571295499801636,
"step": 3660,
"valid_targets_mean": 2946.4,
"valid_targets_min": 957
},
{
"epoch": 5.854632587859425,
"grad_norm": 0.9457931068247055,
"learning_rate": 3.1843340232222064e-06,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23238760232925415,
"step": 3665,
"valid_targets_mean": 2739.9,
"valid_targets_min": 848
},
{
"epoch": 5.862619808306709,
"grad_norm": 0.7880116160919101,
"learning_rate": 3.1413336711143437e-06,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2589631974697113,
"step": 3670,
"valid_targets_mean": 3419.8,
"valid_targets_min": 1110
},
{
"epoch": 5.8706070287539935,
"grad_norm": 0.8733165347603803,
"learning_rate": 3.0986008714000703e-06,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2866963744163513,
"step": 3675,
"valid_targets_mean": 2831.0,
"valid_targets_min": 1189
},
{
"epoch": 5.878594249201278,
"grad_norm": 0.9061936948826054,
"learning_rate": 3.056136302262489e-06,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2790377140045166,
"step": 3680,
"valid_targets_mean": 2385.3,
"valid_targets_min": 995
},
{
"epoch": 5.886581469648562,
"grad_norm": 0.7744924847924733,
"learning_rate": 3.0139406376278212e-06,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23188713192939758,
"step": 3685,
"valid_targets_mean": 3068.9,
"valid_targets_min": 1151
},
{
"epoch": 5.894568690095847,
"grad_norm": 0.8593959472274256,
"learning_rate": 2.972014547154671e-06,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28993451595306396,
"step": 3690,
"valid_targets_mean": 2661.4,
"valid_targets_min": 1105
},
{
"epoch": 5.902555910543131,
"grad_norm": 0.872637452202428,
"learning_rate": 2.930358696223423e-06,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2856522500514984,
"step": 3695,
"valid_targets_mean": 2584.5,
"valid_targets_min": 1043
},
{
"epoch": 5.9105431309904155,
"grad_norm": 0.7625580478157692,
"learning_rate": 2.8889737459256695e-06,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2512621581554413,
"step": 3700,
"valid_targets_mean": 3041.8,
"valid_targets_min": 810
},
{
"epoch": 5.9185303514377,
"grad_norm": 0.817825382177412,
"learning_rate": 2.8478603530537285e-06,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.271395742893219,
"step": 3705,
"valid_targets_mean": 2701.8,
"valid_targets_min": 1104
},
{
"epoch": 5.926517571884984,
"grad_norm": 0.945231408750339,
"learning_rate": 2.8070191700902194e-06,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3027716875076294,
"step": 3710,
"valid_targets_mean": 2422.8,
"valid_targets_min": 866
},
{
"epoch": 5.934504792332269,
"grad_norm": 0.9458089413545945,
"learning_rate": 2.7664508451976903e-06,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2904042899608612,
"step": 3715,
"valid_targets_mean": 2483.2,
"valid_targets_min": 898
},
{
"epoch": 5.942492012779553,
"grad_norm": 0.8523965806490982,
"learning_rate": 2.726156022208362e-06,
"loss": 0.3002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28088122606277466,
"step": 3720,
"valid_targets_mean": 2949.6,
"valid_targets_min": 666
},
{
"epoch": 5.950479233226837,
"grad_norm": 0.8763501591941483,
"learning_rate": 2.6861353406138713e-06,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27324312925338745,
"step": 3725,
"valid_targets_mean": 2387.6,
"valid_targets_min": 895
},
{
"epoch": 5.958466453674122,
"grad_norm": 0.878634194918592,
"learning_rate": 2.646389435555172e-06,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32627028226852417,
"step": 3730,
"valid_targets_mean": 3211.6,
"valid_targets_min": 891
},
{
"epoch": 5.966453674121405,
"grad_norm": 0.8672653374965403,
"learning_rate": 2.6069189378124015e-06,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31162893772125244,
"step": 3735,
"valid_targets_mean": 2756.2,
"valid_targets_min": 1049
},
{
"epoch": 5.97444089456869,
"grad_norm": 0.9052303395289947,
"learning_rate": 2.567724473794908e-06,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3283204436302185,
"step": 3740,
"valid_targets_mean": 2518.8,
"valid_targets_min": 949
},
{
"epoch": 5.982428115015974,
"grad_norm": 0.9078280494758757,
"learning_rate": 2.5288066655312914e-06,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2921939492225647,
"step": 3745,
"valid_targets_mean": 2445.1,
"valid_targets_min": 1158
},
{
"epoch": 5.9904153354632586,
"grad_norm": 0.9142787916430909,
"learning_rate": 2.4901661306595414e-06,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3068923354148865,
"step": 3750,
"valid_targets_mean": 2726.0,
"valid_targets_min": 778
},
{
"epoch": 5.998402555910543,
"grad_norm": 0.8715476605369831,
"learning_rate": 2.451803482417234e-06,
"loss": 0.3183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3258388340473175,
"step": 3755,
"valid_targets_mean": 2622.8,
"valid_targets_min": 784
},
{
"epoch": 6.006389776357827,
"grad_norm": 0.8127550034791736,
"learning_rate": 2.413719329631785e-06,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.275146484375,
"step": 3760,
"valid_targets_mean": 2720.4,
"valid_targets_min": 740
},
{
"epoch": 6.014376996805112,
"grad_norm": 0.8144087631669996,
"learning_rate": 2.375914276710811e-06,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2622288167476654,
"step": 3765,
"valid_targets_mean": 2943.3,
"valid_targets_min": 1245
},
{
"epoch": 6.022364217252396,
"grad_norm": 0.7721698190279348,
"learning_rate": 2.338388923632513e-06,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2618906497955322,
"step": 3770,
"valid_targets_mean": 2792.1,
"valid_targets_min": 1287
},
{
"epoch": 6.0303514376996805,
"grad_norm": 0.8398697731858585,
"learning_rate": 2.3011438659361794e-06,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27312394976615906,
"step": 3775,
"valid_targets_mean": 2793.1,
"valid_targets_min": 1555
},
{
"epoch": 6.038338658146965,
"grad_norm": 0.8567900298455935,
"learning_rate": 2.2641796947127114e-06,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28074395656585693,
"step": 3780,
"valid_targets_mean": 2851.5,
"valid_targets_min": 964
},
{
"epoch": 6.046325878594249,
"grad_norm": 0.923861896817049,
"learning_rate": 2.2274969965952553e-06,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32039231061935425,
"step": 3785,
"valid_targets_mean": 2628.1,
"valid_targets_min": 1072
},
{
"epoch": 6.054313099041534,
"grad_norm": 0.8181909679032574,
"learning_rate": 2.1910963537498887e-06,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2667577266693115,
"step": 3790,
"valid_targets_mean": 2870.7,
"valid_targets_min": 1164
},
{
"epoch": 6.062300319488818,
"grad_norm": 0.8109778169918753,
"learning_rate": 2.1549783438663872e-06,
"loss": 0.2716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2527042627334595,
"step": 3795,
"valid_targets_mean": 3018.8,
"valid_targets_min": 1043
},
{
"epoch": 6.0702875399361025,
"grad_norm": 0.8499658360083157,
"learning_rate": 2.1191435401490534e-06,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25481629371643066,
"step": 3800,
"valid_targets_mean": 2641.6,
"valid_targets_min": 1046
},
{
"epoch": 6.078274760383387,
"grad_norm": 0.924864077463184,
"learning_rate": 2.0835925113076062e-06,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26144057512283325,
"step": 3805,
"valid_targets_mean": 2630.7,
"valid_targets_min": 1213
},
{
"epoch": 6.086261980830671,
"grad_norm": 0.8611502725518941,
"learning_rate": 2.0483258215481784e-06,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28638124465942383,
"step": 3810,
"valid_targets_mean": 2681.8,
"valid_targets_min": 915
},
{
"epoch": 6.094249201277956,
"grad_norm": 0.93643148378172,
"learning_rate": 2.0133440305643413e-06,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2659624218940735,
"step": 3815,
"valid_targets_mean": 2374.9,
"valid_targets_min": 1264
},
{
"epoch": 6.102236421725239,
"grad_norm": 0.9094153943052289,
"learning_rate": 1.9786476935282463e-06,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29782217741012573,
"step": 3820,
"valid_targets_mean": 2679.3,
"valid_targets_min": 1140
},
{
"epoch": 6.110223642172524,
"grad_norm": 0.8578921212730504,
"learning_rate": 1.944237361081782e-06,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30669862031936646,
"step": 3825,
"valid_targets_mean": 2931.2,
"valid_targets_min": 919
},
{
"epoch": 6.118210862619808,
"grad_norm": 0.8774447171982998,
"learning_rate": 1.9101135793278746e-06,
"loss": 0.2848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24913069605827332,
"step": 3830,
"valid_targets_mean": 2745.9,
"valid_targets_min": 1024
},
{
"epoch": 6.126198083067092,
"grad_norm": 0.8198399829117742,
"learning_rate": 1.8762768898217732e-06,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930334806442261,
"step": 3835,
"valid_targets_mean": 2795.0,
"valid_targets_min": 747
},
{
"epoch": 6.134185303514377,
"grad_norm": 0.6701701605321356,
"learning_rate": 1.8427278295625006e-06,
"loss": 0.2795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23434777557849884,
"step": 3840,
"valid_targets_mean": 3436.4,
"valid_targets_min": 1204
},
{
"epoch": 6.142172523961661,
"grad_norm": 1.0174049901842122,
"learning_rate": 1.8094669309843161e-06,
"loss": 0.2741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28728413581848145,
"step": 3845,
"valid_targets_mean": 2038.7,
"valid_targets_min": 1061
},
{
"epoch": 6.1501597444089455,
"grad_norm": 0.7377419451238836,
"learning_rate": 1.776494721948241e-06,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26700955629348755,
"step": 3850,
"valid_targets_mean": 3754.7,
"valid_targets_min": 1146
},
{
"epoch": 6.15814696485623,
"grad_norm": 0.8809290165165347,
"learning_rate": 1.7438117257337239e-06,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22705921530723572,
"step": 3855,
"valid_targets_mean": 2662.8,
"valid_targets_min": 944
},
{
"epoch": 6.166134185303514,
"grad_norm": 0.8531110330155715,
"learning_rate": 1.7114184610302964e-06,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27642789483070374,
"step": 3860,
"valid_targets_mean": 3141.9,
"valid_targets_min": 1396
},
{
"epoch": 6.174121405750799,
"grad_norm": 0.7792356842403435,
"learning_rate": 1.67931544192937e-06,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26689833402633667,
"step": 3865,
"valid_targets_mean": 3185.1,
"valid_targets_min": 1228
},
{
"epoch": 6.182108626198083,
"grad_norm": 0.932186250287318,
"learning_rate": 1.6475031779160611e-06,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29413291811943054,
"step": 3870,
"valid_targets_mean": 2828.4,
"valid_targets_min": 817
},
{
"epoch": 6.1900958466453675,
"grad_norm": 0.9999872211296582,
"learning_rate": 1.6159821738611192e-06,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3073047697544098,
"step": 3875,
"valid_targets_mean": 2609.2,
"valid_targets_min": 1015
},
{
"epoch": 6.198083067092652,
"grad_norm": 0.8522969496137042,
"learning_rate": 1.5847529300128827e-06,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2496946156024933,
"step": 3880,
"valid_targets_mean": 2715.8,
"valid_targets_min": 947
},
{
"epoch": 6.206070287539936,
"grad_norm": 0.8205921714964237,
"learning_rate": 1.5538159419893895e-06,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3144986629486084,
"step": 3885,
"valid_targets_mean": 3409.3,
"valid_targets_min": 1203
},
{
"epoch": 6.214057507987221,
"grad_norm": 1.0161305576290838,
"learning_rate": 1.5231717007704738e-06,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28573137521743774,
"step": 3890,
"valid_targets_mean": 2113.8,
"valid_targets_min": 671
},
{
"epoch": 6.222044728434505,
"grad_norm": 0.8504064835959527,
"learning_rate": 1.4928206926899801e-06,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27324777841567993,
"step": 3895,
"valid_targets_mean": 2668.8,
"valid_targets_min": 876
},
{
"epoch": 6.2300319488817895,
"grad_norm": 0.8751818535512605,
"learning_rate": 1.4627633994280599e-06,
"loss": 0.2901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3199600577354431,
"step": 3900,
"valid_targets_mean": 2899.5,
"valid_targets_min": 1095
},
{
"epoch": 6.238019169329074,
"grad_norm": 0.8728480586187728,
"learning_rate": 1.433000298003504e-06,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25064951181411743,
"step": 3905,
"valid_targets_mean": 3270.7,
"valid_targets_min": 1027
},
{
"epoch": 6.246006389776358,
"grad_norm": 0.7665455493403013,
"learning_rate": 1.4035318607662029e-06,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28335410356521606,
"step": 3910,
"valid_targets_mean": 3683.3,
"valid_targets_min": 1096
},
{
"epoch": 6.253993610223642,
"grad_norm": 0.7720218615283687,
"learning_rate": 1.3743585553896144e-06,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29515159130096436,
"step": 3915,
"valid_targets_mean": 3592.1,
"valid_targets_min": 1158
},
{
"epoch": 6.261980830670926,
"grad_norm": 0.9127307390415227,
"learning_rate": 1.345480844863376e-06,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.280670166015625,
"step": 3920,
"valid_targets_mean": 2674.4,
"valid_targets_min": 1174
},
{
"epoch": 6.2699680511182105,
"grad_norm": 0.8744155416369218,
"learning_rate": 1.316899187485925e-06,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26286551356315613,
"step": 3925,
"valid_targets_mean": 2467.4,
"valid_targets_min": 1295
},
{
"epoch": 6.277955271565495,
"grad_norm": 1.0050448884691408,
"learning_rate": 1.288614036857252e-06,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2835194766521454,
"step": 3930,
"valid_targets_mean": 2397.7,
"valid_targets_min": 613
},
{
"epoch": 6.285942492012779,
"grad_norm": 1.073465147880673,
"learning_rate": 1.260625841871692e-06,
"loss": 0.269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30487751960754395,
"step": 3935,
"valid_targets_mean": 1912.4,
"valid_targets_min": 784
},
{
"epoch": 6.293929712460064,
"grad_norm": 0.9475913607873788,
"learning_rate": 1.2329350467107925e-06,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3098008334636688,
"step": 3940,
"valid_targets_mean": 2448.3,
"valid_targets_min": 1050
},
{
"epoch": 6.301916932907348,
"grad_norm": 0.8134903936892746,
"learning_rate": 1.2055420908362781e-06,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2720017433166504,
"step": 3945,
"valid_targets_mean": 2767.9,
"valid_targets_min": 681
},
{
"epoch": 6.3099041533546325,
"grad_norm": 0.8888924414509212,
"learning_rate": 1.1784474089830612e-06,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28785115480422974,
"step": 3950,
"valid_targets_mean": 2391.2,
"valid_targets_min": 1345
},
{
"epoch": 6.317891373801917,
"grad_norm": 0.86398511760062,
"learning_rate": 1.1516514311523607e-06,
"loss": 0.2731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3019968271255493,
"step": 3955,
"valid_targets_mean": 3056.1,
"valid_targets_min": 1161
},
{
"epoch": 6.325878594249201,
"grad_norm": 0.9214178738753978,
"learning_rate": 1.1251545826048593e-06,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911544442176819,
"step": 3960,
"valid_targets_mean": 2535.8,
"valid_targets_min": 938
},
{
"epoch": 6.333865814696486,
"grad_norm": 0.865667826552045,
"learning_rate": 1.098957283853972e-06,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2934360206127167,
"step": 3965,
"valid_targets_mean": 2922.7,
"valid_targets_min": 1151
},
{
"epoch": 6.34185303514377,
"grad_norm": 0.7197667191842236,
"learning_rate": 1.0730599506591476e-06,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2684939503669739,
"step": 3970,
"valid_targets_mean": 3498.9,
"valid_targets_min": 1109
},
{
"epoch": 6.3498402555910545,
"grad_norm": 1.0547057892528122,
"learning_rate": 1.0474629940192994e-06,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28599128127098083,
"step": 3975,
"valid_targets_mean": 2373.9,
"valid_targets_min": 981
},
{
"epoch": 6.357827476038339,
"grad_norm": 0.7493494299222992,
"learning_rate": 1.0221668201662726e-06,
"loss": 0.2826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27192163467407227,
"step": 3980,
"valid_targets_mean": 3340.1,
"valid_targets_min": 933
},
{
"epoch": 6.365814696485623,
"grad_norm": 0.8997567714591271,
"learning_rate": 9.971718305583767e-07,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30002540349960327,
"step": 3985,
"valid_targets_mean": 2738.8,
"valid_targets_min": 905
},
{
"epoch": 6.373801916932908,
"grad_norm": 0.8866650690614957,
"learning_rate": 9.724784218740524e-07,
"loss": 0.2823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28500303626060486,
"step": 3990,
"valid_targets_mean": 2653.4,
"valid_targets_min": 811
},
{
"epoch": 6.381789137380192,
"grad_norm": 0.9347856270629038,
"learning_rate": 9.480869860055364e-07,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27928462624549866,
"step": 3995,
"valid_targets_mean": 2648.6,
"valid_targets_min": 617
},
{
"epoch": 6.389776357827476,
"grad_norm": 1.0017367851930086,
"learning_rate": 9.239979100526763e-07,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29938584566116333,
"step": 4000,
"valid_targets_mean": 2246.9,
"valid_targets_min": 993
},
{
"epoch": 6.397763578274761,
"grad_norm": 0.8659652867802654,
"learning_rate": 9.002115763167585e-07,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3003730773925781,
"step": 4005,
"valid_targets_mean": 2882.9,
"valid_targets_min": 1010
},
{
"epoch": 6.405750798722044,
"grad_norm": 0.9034083580157991,
"learning_rate": 8.7672836229447e-07,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2945745289325714,
"step": 4010,
"valid_targets_mean": 2482.9,
"valid_targets_min": 1156
},
{
"epoch": 6.413738019169329,
"grad_norm": 0.8927648422059912,
"learning_rate": 8.535486406718684e-07,
"loss": 0.2729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2580193877220154,
"step": 4015,
"valid_targets_mean": 2508.5,
"valid_targets_min": 763
},
{
"epoch": 6.421725239616613,
"grad_norm": 0.9879607023550055,
"learning_rate": 8.306727793185132e-07,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2995275557041168,
"step": 4020,
"valid_targets_mean": 2534.1,
"valid_targets_min": 1082
},
{
"epoch": 6.4297124600638975,
"grad_norm": 0.7936525585301886,
"learning_rate": 8.081011412815965e-07,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29689520597457886,
"step": 4025,
"valid_targets_mean": 4021.8,
"valid_targets_min": 1473
},
{
"epoch": 6.437699680511182,
"grad_norm": 0.8966996505296543,
"learning_rate": 7.858340847801815e-07,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32515469193458557,
"step": 4030,
"valid_targets_mean": 2741.1,
"valid_targets_min": 1039
},
{
"epoch": 6.445686900958466,
"grad_norm": 1.0500500173826224,
"learning_rate": 7.638719631995406e-07,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28945955634117126,
"step": 4035,
"valid_targets_mean": 2265.1,
"valid_targets_min": 797
},
{
"epoch": 6.453674121405751,
"grad_norm": 0.7971219075331492,
"learning_rate": 7.422151250855214e-07,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2784157693386078,
"step": 4040,
"valid_targets_mean": 3321.6,
"valid_targets_min": 1364
},
{
"epoch": 6.461661341853035,
"grad_norm": 0.8249509940299007,
"learning_rate": 7.208639141390295e-07,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2764117121696472,
"step": 4045,
"valid_targets_mean": 2801.1,
"valid_targets_min": 1112
},
{
"epoch": 6.4696485623003195,
"grad_norm": 0.6754399283991835,
"learning_rate": 6.998186692105657e-07,
"loss": 0.3245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3034869134426117,
"step": 4050,
"valid_targets_mean": 4446.3,
"valid_targets_min": 1249
},
{
"epoch": 6.477635782747604,
"grad_norm": 0.8541733280528224,
"learning_rate": 6.790797242948644e-07,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28104281425476074,
"step": 4055,
"valid_targets_mean": 2924.0,
"valid_targets_min": 1210
},
{
"epoch": 6.485623003194888,
"grad_norm": 0.8991862823370763,
"learning_rate": 6.5864740852557e-07,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29677364230155945,
"step": 4060,
"valid_targets_mean": 2876.8,
"valid_targets_min": 1021
},
{
"epoch": 6.493610223642173,
"grad_norm": 0.923502088444072,
"learning_rate": 6.385220461700248e-07,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2582230865955353,
"step": 4065,
"valid_targets_mean": 2419.9,
"valid_targets_min": 1113
},
{
"epoch": 6.501597444089457,
"grad_norm": 0.8923137741720667,
"learning_rate": 6.187039566241337e-07,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29919350147247314,
"step": 4070,
"valid_targets_mean": 2512.4,
"valid_targets_min": 1190
},
{
"epoch": 6.5095846645367414,
"grad_norm": 0.947003285788988,
"learning_rate": 5.99193454407272e-07,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25678086280822754,
"step": 4075,
"valid_targets_mean": 2908.8,
"valid_targets_min": 852
},
{
"epoch": 6.517571884984026,
"grad_norm": 0.9290365545693675,
"learning_rate": 5.799908491573148e-07,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2681635618209839,
"step": 4080,
"valid_targets_mean": 2875.2,
"valid_targets_min": 1035
},
{
"epoch": 6.52555910543131,
"grad_norm": 0.8055510758263922,
"learning_rate": 5.610964456257107e-07,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3032207787036896,
"step": 4085,
"valid_targets_mean": 3016.1,
"valid_targets_min": 860
},
{
"epoch": 6.533546325878595,
"grad_norm": 0.8661559196905022,
"learning_rate": 5.425105436726496e-07,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192429542541504,
"step": 4090,
"valid_targets_mean": 3199.2,
"valid_targets_min": 1193
},
{
"epoch": 6.541533546325878,
"grad_norm": 0.8334359620774163,
"learning_rate": 5.242334382623004e-07,
"loss": 0.2795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644953727722168,
"step": 4095,
"valid_targets_mean": 2952.7,
"valid_targets_min": 1006
},
{
"epoch": 6.549520766773163,
"grad_norm": 0.8345711981656436,
"learning_rate": 5.062654194581429e-07,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2751539349555969,
"step": 4100,
"valid_targets_mean": 2936.6,
"valid_targets_min": 1057
},
{
"epoch": 6.557507987220447,
"grad_norm": 0.8249390721549272,
"learning_rate": 4.88606772418343e-07,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27628517150878906,
"step": 4105,
"valid_targets_mean": 3009.9,
"valid_targets_min": 1232
},
{
"epoch": 6.565495207667731,
"grad_norm": 0.8906179256977498,
"learning_rate": 4.7125777739123857e-07,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26204580068588257,
"step": 4110,
"valid_targets_mean": 2616.2,
"valid_targets_min": 786
},
{
"epoch": 6.573482428115016,
"grad_norm": 0.9564767125815427,
"learning_rate": 4.54218709710903e-07,
"loss": 0.2856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27267003059387207,
"step": 4115,
"valid_targets_mean": 2530.6,
"valid_targets_min": 835
},
{
"epoch": 6.5814696485623,
"grad_norm": 1.0097256008643347,
"learning_rate": 4.374898397927507e-07,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.280648410320282,
"step": 4120,
"valid_targets_mean": 2028.9,
"valid_targets_min": 879
},
{
"epoch": 6.5894568690095845,
"grad_norm": 0.7910653764082966,
"learning_rate": 4.210714331292698e-07,
"loss": 0.258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25909939408302307,
"step": 4125,
"valid_targets_mean": 3639.0,
"valid_targets_min": 640
},
{
"epoch": 6.597444089456869,
"grad_norm": 0.8967697560189001,
"learning_rate": 4.049637502857895e-07,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31095483899116516,
"step": 4130,
"valid_targets_mean": 2755.9,
"valid_targets_min": 1118
},
{
"epoch": 6.605431309904153,
"grad_norm": 0.8044131928051629,
"learning_rate": 3.8916704689635707e-07,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26935964822769165,
"step": 4135,
"valid_targets_mean": 3220.1,
"valid_targets_min": 715
},
{
"epoch": 6.613418530351438,
"grad_norm": 0.9486702138753735,
"learning_rate": 3.736815736596766e-07,
"loss": 0.2782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.262970507144928,
"step": 4140,
"valid_targets_mean": 2247.6,
"valid_targets_min": 1247
},
{
"epoch": 6.621405750798722,
"grad_norm": 0.9444733020979281,
"learning_rate": 3.5850757633513424e-07,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2954460382461548,
"step": 4145,
"valid_targets_mean": 2492.8,
"valid_targets_min": 960
},
{
"epoch": 6.6293929712460065,
"grad_norm": 0.8264663607471652,
"learning_rate": 3.4364529573888803e-07,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2821193337440491,
"step": 4150,
"valid_targets_mean": 3666.4,
"valid_targets_min": 1362
},
{
"epoch": 6.637380191693291,
"grad_norm": 0.7883252732780124,
"learning_rate": 3.2909496774005344e-07,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24705815315246582,
"step": 4155,
"valid_targets_mean": 3010.6,
"valid_targets_min": 760
},
{
"epoch": 6.645367412140575,
"grad_norm": 0.8581251837834798,
"learning_rate": 3.14856823256966e-07,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2624890208244324,
"step": 4160,
"valid_targets_mean": 2668.6,
"valid_targets_min": 1019
},
{
"epoch": 6.65335463258786,
"grad_norm": 0.8240095528399365,
"learning_rate": 3.009310882534999e-07,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29036304354667664,
"step": 4165,
"valid_targets_mean": 2824.6,
"valid_targets_min": 963
},
{
"epoch": 6.661341853035144,
"grad_norm": 0.7516190273322936,
"learning_rate": 2.8731798373550004e-07,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25370168685913086,
"step": 4170,
"valid_targets_mean": 3306.3,
"valid_targets_min": 1047
},
{
"epoch": 6.669329073482428,
"grad_norm": 0.9547075812225164,
"learning_rate": 2.740177257472576e-07,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3222120404243469,
"step": 4175,
"valid_targets_mean": 2726.6,
"valid_targets_min": 1220
},
{
"epoch": 6.677316293929713,
"grad_norm": 0.9147687950227396,
"learning_rate": 2.6103052536810226e-07,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2797955274581909,
"step": 4180,
"valid_targets_mean": 2509.3,
"valid_targets_min": 1157
},
{
"epoch": 6.685303514376997,
"grad_norm": 0.9628729966351203,
"learning_rate": 2.4835658870902226e-07,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3168693780899048,
"step": 4185,
"valid_targets_mean": 2480.8,
"valid_targets_min": 891
},
{
"epoch": 6.693290734824281,
"grad_norm": 0.9351117480178864,
"learning_rate": 2.3599611690943158e-07,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3047877848148346,
"step": 4190,
"valid_targets_mean": 2964.2,
"valid_targets_min": 1300
},
{
"epoch": 6.701277955271565,
"grad_norm": 1.0413196442161707,
"learning_rate": 2.2394930613393927e-07,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2819758653640747,
"step": 4195,
"valid_targets_mean": 2164.5,
"valid_targets_min": 881
},
{
"epoch": 6.7092651757188495,
"grad_norm": 0.8822261803756162,
"learning_rate": 2.122163475692629e-07,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3054836392402649,
"step": 4200,
"valid_targets_mean": 2828.2,
"valid_targets_min": 747
},
{
"epoch": 6.717252396166134,
"grad_norm": 1.3216177064624284,
"learning_rate": 2.0079742742118878e-07,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2610338032245636,
"step": 4205,
"valid_targets_mean": 3650.8,
"valid_targets_min": 1250
},
{
"epoch": 6.725239616613418,
"grad_norm": 0.9383861038544505,
"learning_rate": 1.8969272691160334e-07,
"loss": 0.2716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30719295144081116,
"step": 4210,
"valid_targets_mean": 2418.2,
"valid_targets_min": 1321
},
{
"epoch": 6.733226837060703,
"grad_norm": 0.8409922729450794,
"learning_rate": 1.789024222756397e-07,
"loss": 0.2782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.265010803937912,
"step": 4215,
"valid_targets_mean": 3095.4,
"valid_targets_min": 1215
},
{
"epoch": 6.741214057507987,
"grad_norm": 0.7495800721357617,
"learning_rate": 1.6842668475885782e-07,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3141767978668213,
"step": 4220,
"valid_targets_mean": 4236.1,
"valid_targets_min": 1231
},
{
"epoch": 6.7492012779552715,
"grad_norm": 0.8522557539051201,
"learning_rate": 1.582656806145444e-07,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2988400459289551,
"step": 4225,
"valid_targets_mean": 3127.9,
"valid_targets_min": 1049
},
{
"epoch": 6.757188498402556,
"grad_norm": 0.9893507336164773,
"learning_rate": 1.4841957110106388e-07,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28573116660118103,
"step": 4230,
"valid_targets_mean": 2120.6,
"valid_targets_min": 925
},
{
"epoch": 6.76517571884984,
"grad_norm": 0.9491247142208109,
"learning_rate": 1.388885124793049e-07,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31920358538627625,
"step": 4235,
"valid_targets_mean": 2578.9,
"valid_targets_min": 1035
},
{
"epoch": 6.773162939297125,
"grad_norm": 0.7611128237185949,
"learning_rate": 1.2967265601019573e-07,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2846299409866333,
"step": 4240,
"valid_targets_mean": 3655.2,
"valid_targets_min": 1028
},
{
"epoch": 6.781150159744409,
"grad_norm": 0.9210913647426122,
"learning_rate": 1.207721479523105e-07,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35080933570861816,
"step": 4245,
"valid_targets_mean": 2840.4,
"valid_targets_min": 1261
},
{
"epoch": 6.789137380191693,
"grad_norm": 1.721647903989534,
"learning_rate": 1.1218712955954003e-07,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2759488821029663,
"step": 4250,
"valid_targets_mean": 2726.2,
"valid_targets_min": 1174
},
{
"epoch": 6.797124600638978,
"grad_norm": 0.8118881713456394,
"learning_rate": 1.0391773707885578e-07,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3287505507469177,
"step": 4255,
"valid_targets_mean": 3890.9,
"valid_targets_min": 1776
},
{
"epoch": 6.805111821086262,
"grad_norm": 1.0237761097745328,
"learning_rate": 9.596410174814497e-08,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3121640682220459,
"step": 4260,
"valid_targets_mean": 2273.5,
"valid_targets_min": 985
},
{
"epoch": 6.813099041533547,
"grad_norm": 0.8756144489602926,
"learning_rate": 8.83263497941278e-08,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2863563895225525,
"step": 4265,
"valid_targets_mean": 3378.8,
"valid_targets_min": 1177
},
{
"epoch": 6.821086261980831,
"grad_norm": 0.9055578315212417,
"learning_rate": 8.10046024303568e-08,
"loss": 0.2796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192518949508667,
"step": 4270,
"valid_targets_mean": 2526.4,
"valid_targets_min": 866
},
{
"epoch": 6.8290734824281145,
"grad_norm": 0.828803979329337,
"learning_rate": 7.399897585528726e-08,
"loss": 0.269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.275405615568161,
"step": 4275,
"valid_targets_mean": 3092.6,
"valid_targets_min": 1241
},
{
"epoch": 6.8370607028754,
"grad_norm": 0.8196124102717052,
"learning_rate": 6.730958125044319e-08,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27911484241485596,
"step": 4280,
"valid_targets_mean": 3558.2,
"valid_targets_min": 1120
},
{
"epoch": 6.845047923322683,
"grad_norm": 0.8901874965419135,
"learning_rate": 6.093652477864309e-08,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26097339391708374,
"step": 4285,
"valid_targets_mean": 3068.0,
"valid_targets_min": 1169
},
{
"epoch": 6.853035143769968,
"grad_norm": 0.8655935287765495,
"learning_rate": 5.4879907582316986e-08,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2756623923778534,
"step": 4290,
"valid_targets_mean": 3080.9,
"valid_targets_min": 1257
},
{
"epoch": 6.861022364217252,
"grad_norm": 0.7648381612652023,
"learning_rate": 4.913982578190535e-08,
"loss": 0.2739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2539091110229492,
"step": 4295,
"valid_targets_mean": 3344.6,
"valid_targets_min": 1276
},
{
"epoch": 6.8690095846645365,
"grad_norm": 0.8390658265719673,
"learning_rate": 4.3716370474331527e-08,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36022868752479553,
"step": 4300,
"valid_targets_mean": 2998.6,
"valid_targets_min": 1162
},
{
"epoch": 6.876996805111821,
"grad_norm": 0.8055876615636595,
"learning_rate": 3.8609627731558405e-08,
"loss": 0.2628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24102458357810974,
"step": 4305,
"valid_targets_mean": 3242.4,
"valid_targets_min": 1254
},
{
"epoch": 6.884984025559105,
"grad_norm": 0.9539831877236683,
"learning_rate": 3.381967859920954e-08,
"loss": 0.2784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2361864149570465,
"step": 4310,
"valid_targets_mean": 2221.6,
"valid_targets_min": 1262
},
{
"epoch": 6.89297124600639,
"grad_norm": 0.9029039854454836,
"learning_rate": 2.9346599095305685e-08,
"loss": 0.2756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3124200999736786,
"step": 4315,
"valid_targets_mean": 3012.0,
"valid_targets_min": 1108
},
{
"epoch": 6.900958466453674,
"grad_norm": 0.9294252530003244,
"learning_rate": 2.5190460209039146e-08,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.320919394493103,
"step": 4320,
"valid_targets_mean": 2418.2,
"valid_targets_min": 1051
},
{
"epoch": 6.9089456869009584,
"grad_norm": 0.8167670634707263,
"learning_rate": 2.1351327899656883e-08,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3053489923477173,
"step": 4325,
"valid_targets_mean": 3051.6,
"valid_targets_min": 1233
},
{
"epoch": 6.916932907348243,
"grad_norm": 0.891874638674044,
"learning_rate": 1.782926309540578e-08,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3282131850719452,
"step": 4330,
"valid_targets_mean": 2809.9,
"valid_targets_min": 1303
},
{
"epoch": 6.924920127795527,
"grad_norm": 0.8436959953986517,
"learning_rate": 1.462432169257344e-08,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2719654440879822,
"step": 4335,
"valid_targets_mean": 3073.7,
"valid_targets_min": 1214
},
{
"epoch": 6.932907348242812,
"grad_norm": 0.8769982264320124,
"learning_rate": 1.1736554554604429e-08,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28453394770622253,
"step": 4340,
"valid_targets_mean": 2600.9,
"valid_targets_min": 1517
},
{
"epoch": 6.940894568690096,
"grad_norm": 0.799917953202752,
"learning_rate": 9.166007511274278e-09,
"loss": 0.3088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3287510871887207,
"step": 4345,
"valid_targets_mean": 3648.2,
"valid_targets_min": 873
},
{
"epoch": 6.94888178913738,
"grad_norm": 0.9188207110001246,
"learning_rate": 6.912721357985597e-09,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2823947072029114,
"step": 4350,
"valid_targets_mean": 2750.2,
"valid_targets_min": 1078
},
{
"epoch": 6.956869009584665,
"grad_norm": 0.8966652036625243,
"learning_rate": 4.976731855104166e-09,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2613156735897064,
"step": 4355,
"valid_targets_mean": 2528.8,
"valid_targets_min": 909
},
{
"epoch": 6.964856230031949,
"grad_norm": 0.9156629228599535,
"learning_rate": 3.3580697274016028e-09,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30315962433815,
"step": 4360,
"valid_targets_mean": 2685.6,
"valid_targets_min": 1197
},
{
"epoch": 6.972843450479234,
"grad_norm": 0.7280740965258752,
"learning_rate": 2.056760663555757e-09,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2657495141029358,
"step": 4365,
"valid_targets_mean": 3746.4,
"valid_targets_min": 1229
},
{
"epoch": 6.980830670926517,
"grad_norm": 0.9132105098927803,
"learning_rate": 1.0728253157599178e-09,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.305087685585022,
"step": 4370,
"valid_targets_mean": 2696.9,
"valid_targets_min": 657
},
{
"epoch": 6.988817891373802,
"grad_norm": 0.8569350748102568,
"learning_rate": 4.062792993786424e-10,
"loss": 0.2613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24934561550617218,
"step": 4375,
"valid_targets_mean": 2357.8,
"valid_targets_min": 919
},
{
"epoch": 6.996805111821086,
"grad_norm": 0.9999686364147095,
"learning_rate": 5.7133192707947705e-11,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2727892994880676,
"step": 4380,
"valid_targets_mean": 2353.3,
"valid_targets_min": 1390
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24196135997772217,
"step": 4382,
"total_flos": 881525354463232.0,
"train_loss": 0.37171825520364404,
"train_runtime": 19745.0516,
"train_samples_per_second": 3.548,
"train_steps_per_second": 0.222,
"valid_targets_mean": 3242.5,
"valid_targets_min": 1195
}
],
"logging_steps": 5,
"max_steps": 4382,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 881525354463232.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}