Files
a1-defects4j/trainer_state.json
ModelHub XC 2aa8043d40 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/a1-defects4j
Source: Original Platform
2026-05-13 15:07:21 +08:00

9673 lines
258 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4375,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008,
"grad_norm": 29.0015320167095,
"learning_rate": 3.6529680365296803e-07,
"loss": 0.9436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.9374949932098389,
"step": 5,
"valid_targets_mean": 5346.2,
"valid_targets_min": 1863
},
{
"epoch": 0.016,
"grad_norm": 28.785647078426567,
"learning_rate": 8.219178082191781e-07,
"loss": 0.9171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.9532188177108765,
"step": 10,
"valid_targets_mean": 5302.2,
"valid_targets_min": 2130
},
{
"epoch": 0.024,
"grad_norm": 26.616351818564006,
"learning_rate": 1.278538812785388e-06,
"loss": 0.9016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8873691558837891,
"step": 15,
"valid_targets_mean": 5041.2,
"valid_targets_min": 1753
},
{
"epoch": 0.032,
"grad_norm": 18.931940149483303,
"learning_rate": 1.7351598173515982e-06,
"loss": 0.8321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8346962928771973,
"step": 20,
"valid_targets_mean": 5056.3,
"valid_targets_min": 1670
},
{
"epoch": 0.04,
"grad_norm": 9.219256821460794,
"learning_rate": 2.191780821917808e-06,
"loss": 0.7515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7757815718650818,
"step": 25,
"valid_targets_mean": 5699.4,
"valid_targets_min": 3462
},
{
"epoch": 0.048,
"grad_norm": 4.729746039956276,
"learning_rate": 2.6484018264840183e-06,
"loss": 0.7129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6848674416542053,
"step": 30,
"valid_targets_mean": 6168.1,
"valid_targets_min": 3152
},
{
"epoch": 0.056,
"grad_norm": 2.4602603161083585,
"learning_rate": 3.1050228310502285e-06,
"loss": 0.6598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6890764236450195,
"step": 35,
"valid_targets_mean": 7148.6,
"valid_targets_min": 783
},
{
"epoch": 0.064,
"grad_norm": 1.8763042005789952,
"learning_rate": 3.5616438356164386e-06,
"loss": 0.6163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6118077635765076,
"step": 40,
"valid_targets_mean": 5883.2,
"valid_targets_min": 2516
},
{
"epoch": 0.072,
"grad_norm": 1.602650359787958,
"learning_rate": 4.018264840182649e-06,
"loss": 0.6138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5972576141357422,
"step": 45,
"valid_targets_mean": 5523.7,
"valid_targets_min": 1938
},
{
"epoch": 0.08,
"grad_norm": 1.4500272948050443,
"learning_rate": 4.4748858447488585e-06,
"loss": 0.5783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.544214129447937,
"step": 50,
"valid_targets_mean": 5985.9,
"valid_targets_min": 2378
},
{
"epoch": 0.088,
"grad_norm": 1.009096494436647,
"learning_rate": 4.931506849315069e-06,
"loss": 0.5743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.567956805229187,
"step": 55,
"valid_targets_mean": 5316.4,
"valid_targets_min": 2034
},
{
"epoch": 0.096,
"grad_norm": 0.8031284787989955,
"learning_rate": 5.388127853881279e-06,
"loss": 0.5495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5508638620376587,
"step": 60,
"valid_targets_mean": 5330.8,
"valid_targets_min": 2818
},
{
"epoch": 0.104,
"grad_norm": 0.757836297686658,
"learning_rate": 5.8447488584474885e-06,
"loss": 0.5469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5989420413970947,
"step": 65,
"valid_targets_mean": 6095.4,
"valid_targets_min": 965
},
{
"epoch": 0.112,
"grad_norm": 0.6744715206516015,
"learning_rate": 6.301369863013699e-06,
"loss": 0.5404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5301568508148193,
"step": 70,
"valid_targets_mean": 5555.2,
"valid_targets_min": 2634
},
{
"epoch": 0.12,
"grad_norm": 0.7203043506061609,
"learning_rate": 6.757990867579909e-06,
"loss": 0.513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5385029315948486,
"step": 75,
"valid_targets_mean": 4590.4,
"valid_targets_min": 1978
},
{
"epoch": 0.128,
"grad_norm": 0.5376106997657275,
"learning_rate": 7.214611872146119e-06,
"loss": 0.516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4749385714530945,
"step": 80,
"valid_targets_mean": 6827.4,
"valid_targets_min": 3176
},
{
"epoch": 0.136,
"grad_norm": 0.6106498365181853,
"learning_rate": 7.671232876712329e-06,
"loss": 0.5076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49556079506874084,
"step": 85,
"valid_targets_mean": 5444.6,
"valid_targets_min": 2821
},
{
"epoch": 0.144,
"grad_norm": 0.5289997229974207,
"learning_rate": 8.127853881278539e-06,
"loss": 0.4685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.431709349155426,
"step": 90,
"valid_targets_mean": 6285.6,
"valid_targets_min": 2326
},
{
"epoch": 0.152,
"grad_norm": 0.5416140795290694,
"learning_rate": 8.584474885844748e-06,
"loss": 0.4608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4308019280433655,
"step": 95,
"valid_targets_mean": 5831.9,
"valid_targets_min": 2332
},
{
"epoch": 0.16,
"grad_norm": 0.5038587793531678,
"learning_rate": 9.04109589041096e-06,
"loss": 0.4727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44734400510787964,
"step": 100,
"valid_targets_mean": 6098.7,
"valid_targets_min": 2794
},
{
"epoch": 0.168,
"grad_norm": 0.6499130358808322,
"learning_rate": 9.49771689497717e-06,
"loss": 0.4559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46700429916381836,
"step": 105,
"valid_targets_mean": 5643.3,
"valid_targets_min": 3348
},
{
"epoch": 0.176,
"grad_norm": 0.5164488739469887,
"learning_rate": 9.95433789954338e-06,
"loss": 0.4487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4107072949409485,
"step": 110,
"valid_targets_mean": 5961.1,
"valid_targets_min": 2021
},
{
"epoch": 0.184,
"grad_norm": 0.6640110036460022,
"learning_rate": 1.0410958904109589e-05,
"loss": 0.4481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.418204665184021,
"step": 115,
"valid_targets_mean": 4624.6,
"valid_targets_min": 2451
},
{
"epoch": 0.192,
"grad_norm": 0.5285519912988442,
"learning_rate": 1.08675799086758e-05,
"loss": 0.4061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4019206464290619,
"step": 120,
"valid_targets_mean": 5007.2,
"valid_targets_min": 3000
},
{
"epoch": 0.2,
"grad_norm": 0.6548167137474712,
"learning_rate": 1.132420091324201e-05,
"loss": 0.4426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4582175612449646,
"step": 125,
"valid_targets_mean": 6787.3,
"valid_targets_min": 2528
},
{
"epoch": 0.208,
"grad_norm": 0.5867537785236684,
"learning_rate": 1.178082191780822e-05,
"loss": 0.4217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44458815455436707,
"step": 130,
"valid_targets_mean": 5277.4,
"valid_targets_min": 2969
},
{
"epoch": 0.216,
"grad_norm": 0.5692868498717647,
"learning_rate": 1.223744292237443e-05,
"loss": 0.413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4310612082481384,
"step": 135,
"valid_targets_mean": 5636.2,
"valid_targets_min": 230
},
{
"epoch": 0.224,
"grad_norm": 0.4977876660314295,
"learning_rate": 1.2694063926940641e-05,
"loss": 0.3913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35761088132858276,
"step": 140,
"valid_targets_mean": 6244.7,
"valid_targets_min": 1660
},
{
"epoch": 0.232,
"grad_norm": 0.5977951035748577,
"learning_rate": 1.3150684931506849e-05,
"loss": 0.4021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4173124432563782,
"step": 145,
"valid_targets_mean": 6014.3,
"valid_targets_min": 2804
},
{
"epoch": 0.24,
"grad_norm": 0.5896906397538862,
"learning_rate": 1.360730593607306e-05,
"loss": 0.4133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42406731843948364,
"step": 150,
"valid_targets_mean": 5189.6,
"valid_targets_min": 2551
},
{
"epoch": 0.248,
"grad_norm": 0.5871809118104986,
"learning_rate": 1.406392694063927e-05,
"loss": 0.4066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3785093426704407,
"step": 155,
"valid_targets_mean": 5138.2,
"valid_targets_min": 2204
},
{
"epoch": 0.256,
"grad_norm": 0.5323983997580389,
"learning_rate": 1.4520547945205482e-05,
"loss": 0.4003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37402379512786865,
"step": 160,
"valid_targets_mean": 5847.3,
"valid_targets_min": 2233
},
{
"epoch": 0.264,
"grad_norm": 0.5657381387600574,
"learning_rate": 1.497716894977169e-05,
"loss": 0.384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3925345540046692,
"step": 165,
"valid_targets_mean": 4730.1,
"valid_targets_min": 798
},
{
"epoch": 0.272,
"grad_norm": 0.5962892332796642,
"learning_rate": 1.54337899543379e-05,
"loss": 0.3865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36262843012809753,
"step": 170,
"valid_targets_mean": 4678.3,
"valid_targets_min": 1850
},
{
"epoch": 0.28,
"grad_norm": 0.5815083569532998,
"learning_rate": 1.589041095890411e-05,
"loss": 0.3882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39265549182891846,
"step": 175,
"valid_targets_mean": 4959.8,
"valid_targets_min": 901
},
{
"epoch": 0.288,
"grad_norm": 0.6169273432083452,
"learning_rate": 1.634703196347032e-05,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38367488980293274,
"step": 180,
"valid_targets_mean": 5054.1,
"valid_targets_min": 2086
},
{
"epoch": 0.296,
"grad_norm": 0.5073520805794912,
"learning_rate": 1.680365296803653e-05,
"loss": 0.3696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35496461391448975,
"step": 185,
"valid_targets_mean": 5353.8,
"valid_targets_min": 2311
},
{
"epoch": 0.304,
"grad_norm": 0.5951830285204442,
"learning_rate": 1.726027397260274e-05,
"loss": 0.3697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3645014762878418,
"step": 190,
"valid_targets_mean": 5700.0,
"valid_targets_min": 3838
},
{
"epoch": 0.312,
"grad_norm": 3.284936406262614,
"learning_rate": 1.771689497716895e-05,
"loss": 0.3734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3810313045978546,
"step": 195,
"valid_targets_mean": 4864.6,
"valid_targets_min": 2229
},
{
"epoch": 0.32,
"grad_norm": 0.5815089840052964,
"learning_rate": 1.8173515981735163e-05,
"loss": 0.3804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39126527309417725,
"step": 200,
"valid_targets_mean": 5333.4,
"valid_targets_min": 786
},
{
"epoch": 0.328,
"grad_norm": 0.5871232329779636,
"learning_rate": 1.863013698630137e-05,
"loss": 0.3975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33873528242111206,
"step": 205,
"valid_targets_mean": 5260.6,
"valid_targets_min": 2590
},
{
"epoch": 0.336,
"grad_norm": 0.5623908127082623,
"learning_rate": 1.9086757990867582e-05,
"loss": 0.3872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3926033079624176,
"step": 210,
"valid_targets_mean": 5914.9,
"valid_targets_min": 2290
},
{
"epoch": 0.344,
"grad_norm": 0.5829996789134975,
"learning_rate": 1.954337899543379e-05,
"loss": 0.369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36474674940109253,
"step": 215,
"valid_targets_mean": 5885.6,
"valid_targets_min": 1668
},
{
"epoch": 0.352,
"grad_norm": 0.5814734468612167,
"learning_rate": 2e-05,
"loss": 0.3893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40361806750297546,
"step": 220,
"valid_targets_mean": 6311.9,
"valid_targets_min": 2249
},
{
"epoch": 0.36,
"grad_norm": 0.5922468705700561,
"learning_rate": 2.045662100456621e-05,
"loss": 0.3612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3497602939605713,
"step": 225,
"valid_targets_mean": 5419.3,
"valid_targets_min": 2622
},
{
"epoch": 0.368,
"grad_norm": 0.522456463858042,
"learning_rate": 2.0913242009132424e-05,
"loss": 0.3675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36271563172340393,
"step": 230,
"valid_targets_mean": 6095.4,
"valid_targets_min": 2460
},
{
"epoch": 0.376,
"grad_norm": 0.6424635869072116,
"learning_rate": 2.1369863013698632e-05,
"loss": 0.3867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4467678964138031,
"step": 235,
"valid_targets_mean": 6817.1,
"valid_targets_min": 604
},
{
"epoch": 0.384,
"grad_norm": 0.6594713274606352,
"learning_rate": 2.182648401826484e-05,
"loss": 0.3893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3981528878211975,
"step": 240,
"valid_targets_mean": 4952.9,
"valid_targets_min": 761
},
{
"epoch": 0.392,
"grad_norm": 0.5529439179880414,
"learning_rate": 2.2283105022831052e-05,
"loss": 0.3679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3784303665161133,
"step": 245,
"valid_targets_mean": 6425.6,
"valid_targets_min": 2506
},
{
"epoch": 0.4,
"grad_norm": 0.5831354430338912,
"learning_rate": 2.2739726027397263e-05,
"loss": 0.3759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3691878318786621,
"step": 250,
"valid_targets_mean": 5749.1,
"valid_targets_min": 1980
},
{
"epoch": 0.408,
"grad_norm": 0.65000190634853,
"learning_rate": 2.3196347031963475e-05,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3631196618080139,
"step": 255,
"valid_targets_mean": 4850.5,
"valid_targets_min": 759
},
{
"epoch": 0.416,
"grad_norm": 0.6645578317049943,
"learning_rate": 2.3652968036529683e-05,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3574402630329132,
"step": 260,
"valid_targets_mean": 4735.8,
"valid_targets_min": 2466
},
{
"epoch": 0.424,
"grad_norm": 0.6656191465639894,
"learning_rate": 2.410958904109589e-05,
"loss": 0.3619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.362774521112442,
"step": 265,
"valid_targets_mean": 6647.6,
"valid_targets_min": 2383
},
{
"epoch": 0.432,
"grad_norm": 0.5851717481481281,
"learning_rate": 2.4566210045662106e-05,
"loss": 0.3601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33157211542129517,
"step": 270,
"valid_targets_mean": 4614.8,
"valid_targets_min": 1941
},
{
"epoch": 0.44,
"grad_norm": 0.5751797691958569,
"learning_rate": 2.5022831050228314e-05,
"loss": 0.3423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31601348519325256,
"step": 275,
"valid_targets_mean": 5310.1,
"valid_targets_min": 2662
},
{
"epoch": 0.448,
"grad_norm": 0.5643551630768594,
"learning_rate": 2.547945205479452e-05,
"loss": 0.3632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36333590745925903,
"step": 280,
"valid_targets_mean": 5489.1,
"valid_targets_min": 1956
},
{
"epoch": 0.456,
"grad_norm": 0.5452707045878729,
"learning_rate": 2.593607305936073e-05,
"loss": 0.3542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3407953381538391,
"step": 285,
"valid_targets_mean": 5989.4,
"valid_targets_min": 3143
},
{
"epoch": 0.464,
"grad_norm": 0.6015341682807512,
"learning_rate": 2.6392694063926944e-05,
"loss": 0.3495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36542242765426636,
"step": 290,
"valid_targets_mean": 4879.5,
"valid_targets_min": 904
},
{
"epoch": 0.472,
"grad_norm": 0.4933163499696808,
"learning_rate": 2.6849315068493153e-05,
"loss": 0.352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3441370725631714,
"step": 295,
"valid_targets_mean": 6533.8,
"valid_targets_min": 2505
},
{
"epoch": 0.48,
"grad_norm": 0.6570928110972526,
"learning_rate": 2.7305936073059364e-05,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32394760847091675,
"step": 300,
"valid_targets_mean": 5315.5,
"valid_targets_min": 490
},
{
"epoch": 0.488,
"grad_norm": 0.5963639828543595,
"learning_rate": 2.7762557077625572e-05,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3477485775947571,
"step": 305,
"valid_targets_mean": 5883.1,
"valid_targets_min": 838
},
{
"epoch": 0.496,
"grad_norm": 0.5867601585655516,
"learning_rate": 2.8219178082191783e-05,
"loss": 0.3416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3327102065086365,
"step": 310,
"valid_targets_mean": 6452.5,
"valid_targets_min": 3225
},
{
"epoch": 0.504,
"grad_norm": 0.6010215270774765,
"learning_rate": 2.8675799086757995e-05,
"loss": 0.345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33421438932418823,
"step": 315,
"valid_targets_mean": 5088.0,
"valid_targets_min": 1962
},
{
"epoch": 0.512,
"grad_norm": 0.5707370764644752,
"learning_rate": 2.9132420091324203e-05,
"loss": 0.3323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33381012082099915,
"step": 320,
"valid_targets_mean": 5421.4,
"valid_targets_min": 1666
},
{
"epoch": 0.52,
"grad_norm": 0.5906992975596219,
"learning_rate": 2.958904109589041e-05,
"loss": 0.3622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3678559362888336,
"step": 325,
"valid_targets_mean": 6029.4,
"valid_targets_min": 2516
},
{
"epoch": 0.528,
"grad_norm": 0.5371802016216455,
"learning_rate": 3.0045662100456626e-05,
"loss": 0.3328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2999245524406433,
"step": 330,
"valid_targets_mean": 5799.5,
"valid_targets_min": 3433
},
{
"epoch": 0.536,
"grad_norm": 0.5822954280809008,
"learning_rate": 3.0502283105022834e-05,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33282238245010376,
"step": 335,
"valid_targets_mean": 4737.1,
"valid_targets_min": 1791
},
{
"epoch": 0.544,
"grad_norm": 0.6029890531225149,
"learning_rate": 3.0958904109589045e-05,
"loss": 0.3557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3635110855102539,
"step": 340,
"valid_targets_mean": 5499.4,
"valid_targets_min": 2056
},
{
"epoch": 0.552,
"grad_norm": 0.5655087348685645,
"learning_rate": 3.141552511415525e-05,
"loss": 0.3387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37209635972976685,
"step": 345,
"valid_targets_mean": 5426.6,
"valid_targets_min": 563
},
{
"epoch": 0.56,
"grad_norm": 0.5333462848275267,
"learning_rate": 3.187214611872147e-05,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3303799331188202,
"step": 350,
"valid_targets_mean": 5406.4,
"valid_targets_min": 779
},
{
"epoch": 0.568,
"grad_norm": 0.5295185279670263,
"learning_rate": 3.2328767123287676e-05,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32677990198135376,
"step": 355,
"valid_targets_mean": 5974.3,
"valid_targets_min": 1628
},
{
"epoch": 0.576,
"grad_norm": 0.5983539503289153,
"learning_rate": 3.2785388127853884e-05,
"loss": 0.3459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39269623160362244,
"step": 360,
"valid_targets_mean": 6738.8,
"valid_targets_min": 1678
},
{
"epoch": 0.584,
"grad_norm": 0.5766745460057539,
"learning_rate": 3.324200913242009e-05,
"loss": 0.3342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29778122901916504,
"step": 365,
"valid_targets_mean": 5049.4,
"valid_targets_min": 2193
},
{
"epoch": 0.592,
"grad_norm": 0.6277621549756567,
"learning_rate": 3.369863013698631e-05,
"loss": 0.3292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3347325921058655,
"step": 370,
"valid_targets_mean": 5283.5,
"valid_targets_min": 2402
},
{
"epoch": 0.6,
"grad_norm": 0.5918373851674901,
"learning_rate": 3.4155251141552515e-05,
"loss": 0.34,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36557674407958984,
"step": 375,
"valid_targets_mean": 5248.7,
"valid_targets_min": 2252
},
{
"epoch": 0.608,
"grad_norm": 0.6167625201761314,
"learning_rate": 3.461187214611872e-05,
"loss": 0.3382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3086686432361603,
"step": 380,
"valid_targets_mean": 4223.2,
"valid_targets_min": 711
},
{
"epoch": 0.616,
"grad_norm": 0.5591693735982324,
"learning_rate": 3.506849315068493e-05,
"loss": 0.3504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.368280827999115,
"step": 385,
"valid_targets_mean": 5700.3,
"valid_targets_min": 904
},
{
"epoch": 0.624,
"grad_norm": 0.5799417720813952,
"learning_rate": 3.5525114155251146e-05,
"loss": 0.3294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3143656551837921,
"step": 390,
"valid_targets_mean": 5221.9,
"valid_targets_min": 536
},
{
"epoch": 0.632,
"grad_norm": 0.5433992211523737,
"learning_rate": 3.5981735159817354e-05,
"loss": 0.347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3558363914489746,
"step": 395,
"valid_targets_mean": 5620.7,
"valid_targets_min": 2461
},
{
"epoch": 0.64,
"grad_norm": 0.5621911130490547,
"learning_rate": 3.643835616438356e-05,
"loss": 0.3426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33586400747299194,
"step": 400,
"valid_targets_mean": 6311.3,
"valid_targets_min": 3458
},
{
"epoch": 0.648,
"grad_norm": 0.509645925031835,
"learning_rate": 3.689497716894977e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32601773738861084,
"step": 405,
"valid_targets_mean": 6338.4,
"valid_targets_min": 2329
},
{
"epoch": 0.656,
"grad_norm": 0.5678298273897082,
"learning_rate": 3.7351598173515985e-05,
"loss": 0.3309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3719245195388794,
"step": 410,
"valid_targets_mean": 5888.6,
"valid_targets_min": 2675
},
{
"epoch": 0.664,
"grad_norm": 0.5606239723542871,
"learning_rate": 3.780821917808219e-05,
"loss": 0.3252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3294365406036377,
"step": 415,
"valid_targets_mean": 5571.3,
"valid_targets_min": 2321
},
{
"epoch": 0.672,
"grad_norm": 0.6903980569872955,
"learning_rate": 3.82648401826484e-05,
"loss": 0.3255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35279595851898193,
"step": 420,
"valid_targets_mean": 6234.4,
"valid_targets_min": 631
},
{
"epoch": 0.68,
"grad_norm": 0.5770701013621418,
"learning_rate": 3.8721461187214615e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3458443582057953,
"step": 425,
"valid_targets_mean": 5096.1,
"valid_targets_min": 2409
},
{
"epoch": 0.688,
"grad_norm": 0.7015744477293635,
"learning_rate": 3.9178082191780823e-05,
"loss": 0.3325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3228449821472168,
"step": 430,
"valid_targets_mean": 4802.9,
"valid_targets_min": 932
},
{
"epoch": 0.696,
"grad_norm": 0.5814276027663211,
"learning_rate": 3.963470319634704e-05,
"loss": 0.3348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3646930754184723,
"step": 435,
"valid_targets_mean": 5815.1,
"valid_targets_min": 2370
},
{
"epoch": 0.704,
"grad_norm": 0.6088081325835798,
"learning_rate": 3.99999936325009e-05,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3166343569755554,
"step": 440,
"valid_targets_mean": 6217.9,
"valid_targets_min": 2075
},
{
"epoch": 0.712,
"grad_norm": 0.5402127247441519,
"learning_rate": 3.9999770770457856e-05,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31158143281936646,
"step": 445,
"valid_targets_mean": 6205.0,
"valid_targets_min": 913
},
{
"epoch": 0.72,
"grad_norm": 0.6399233174311737,
"learning_rate": 3.9999229537513936e-05,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32378578186035156,
"step": 450,
"valid_targets_mean": 4884.4,
"valid_targets_min": 1215
},
{
"epoch": 0.728,
"grad_norm": 0.5915756632434621,
"learning_rate": 3.999836994228487e-05,
"loss": 0.3209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3110769987106323,
"step": 455,
"valid_targets_mean": 5154.0,
"valid_targets_min": 1728
},
{
"epoch": 0.736,
"grad_norm": 0.6319049650168674,
"learning_rate": 3.999719199845432e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32748833298683167,
"step": 460,
"valid_targets_mean": 5428.9,
"valid_targets_min": 2531
},
{
"epoch": 0.744,
"grad_norm": 0.5700199682389311,
"learning_rate": 3.999569572477366e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33130866289138794,
"step": 465,
"valid_targets_mean": 5058.3,
"valid_targets_min": 1760
},
{
"epoch": 0.752,
"grad_norm": 0.5092781146395354,
"learning_rate": 3.999388114506166e-05,
"loss": 0.319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3101567327976227,
"step": 470,
"valid_targets_mean": 5335.4,
"valid_targets_min": 2946
},
{
"epoch": 0.76,
"grad_norm": 0.5794130728227729,
"learning_rate": 3.999174828820413e-05,
"loss": 0.3321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30423641204833984,
"step": 475,
"valid_targets_mean": 4474.7,
"valid_targets_min": 2081
},
{
"epoch": 0.768,
"grad_norm": 0.5448773661149979,
"learning_rate": 3.998929718815341e-05,
"loss": 0.3316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32564234733581543,
"step": 480,
"valid_targets_mean": 5164.1,
"valid_targets_min": 2488
},
{
"epoch": 0.776,
"grad_norm": 0.5387594305910872,
"learning_rate": 3.998652788392792e-05,
"loss": 0.3269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3404187262058258,
"step": 485,
"valid_targets_mean": 5412.6,
"valid_targets_min": 818
},
{
"epoch": 0.784,
"grad_norm": 0.5854237384124716,
"learning_rate": 3.9983440419611445e-05,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3279475271701813,
"step": 490,
"valid_targets_mean": 4456.4,
"valid_targets_min": 1879
},
{
"epoch": 0.792,
"grad_norm": 0.564775380231534,
"learning_rate": 3.9980034844352494e-05,
"loss": 0.3254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3300333321094513,
"step": 495,
"valid_targets_mean": 5009.7,
"valid_targets_min": 2930
},
{
"epoch": 0.8,
"grad_norm": 0.5293883302680141,
"learning_rate": 3.9976311212363495e-05,
"loss": 0.3263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3328399658203125,
"step": 500,
"valid_targets_mean": 6093.4,
"valid_targets_min": 3097
},
{
"epoch": 0.808,
"grad_norm": 0.5789613836327289,
"learning_rate": 3.997226958291992e-05,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30174410343170166,
"step": 505,
"valid_targets_mean": 4972.1,
"valid_targets_min": 2321
},
{
"epoch": 0.816,
"grad_norm": 0.5132049869786744,
"learning_rate": 3.996791002035937e-05,
"loss": 0.3193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34351909160614014,
"step": 510,
"valid_targets_mean": 6353.1,
"valid_targets_min": 2811
},
{
"epoch": 0.824,
"grad_norm": 0.5128789381578767,
"learning_rate": 3.996323259408055e-05,
"loss": 0.3237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3485877215862274,
"step": 515,
"valid_targets_mean": 5549.4,
"valid_targets_min": 740
},
{
"epoch": 0.832,
"grad_norm": 0.5402172060969582,
"learning_rate": 3.995823737854211e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30282849073410034,
"step": 520,
"valid_targets_mean": 6072.9,
"valid_targets_min": 1872
},
{
"epoch": 0.84,
"grad_norm": 0.5515819926347459,
"learning_rate": 3.9952924453261534e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2936662435531616,
"step": 525,
"valid_targets_mean": 4590.2,
"valid_targets_min": 2248
},
{
"epoch": 0.848,
"grad_norm": 0.5285706315693174,
"learning_rate": 3.994729390281384e-05,
"loss": 0.3186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3250778913497925,
"step": 530,
"valid_targets_mean": 5578.5,
"valid_targets_min": 2616
},
{
"epoch": 0.856,
"grad_norm": 0.5502402081859151,
"learning_rate": 3.994134581683021e-05,
"loss": 0.3434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3574582040309906,
"step": 535,
"valid_targets_mean": 5670.8,
"valid_targets_min": 3313
},
{
"epoch": 0.864,
"grad_norm": 0.5016293419426597,
"learning_rate": 3.9935080289996626e-05,
"loss": 0.3144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3080974221229553,
"step": 540,
"valid_targets_mean": 5986.4,
"valid_targets_min": 2539
},
{
"epoch": 0.872,
"grad_norm": 0.5660291944457707,
"learning_rate": 3.992849742205228e-05,
"loss": 0.3226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31069374084472656,
"step": 545,
"valid_targets_mean": 6014.2,
"valid_targets_min": 2454
},
{
"epoch": 0.88,
"grad_norm": 0.46398599640649046,
"learning_rate": 3.9921597317788065e-05,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3050593435764313,
"step": 550,
"valid_targets_mean": 6101.0,
"valid_targets_min": 4913
},
{
"epoch": 0.888,
"grad_norm": 0.5349679943298677,
"learning_rate": 3.991438008704486e-05,
"loss": 0.3373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3825862407684326,
"step": 555,
"valid_targets_mean": 7490.4,
"valid_targets_min": 1967
},
{
"epoch": 0.896,
"grad_norm": 0.5129679083648333,
"learning_rate": 3.990684584471179e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3344353437423706,
"step": 560,
"valid_targets_mean": 5056.2,
"valid_targets_min": 991
},
{
"epoch": 0.904,
"grad_norm": 0.5114013214259068,
"learning_rate": 3.989899471072441e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32178831100463867,
"step": 565,
"valid_targets_mean": 5480.6,
"valid_targets_min": 2776
},
{
"epoch": 0.912,
"grad_norm": 0.5551757388586439,
"learning_rate": 3.9890826810062784e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3461974859237671,
"step": 570,
"valid_targets_mean": 5539.6,
"valid_targets_min": 3173
},
{
"epoch": 0.92,
"grad_norm": 0.48095163281778175,
"learning_rate": 3.988234227274949e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3255422115325928,
"step": 575,
"valid_targets_mean": 6356.3,
"valid_targets_min": 2670
},
{
"epoch": 0.928,
"grad_norm": 0.5337169643841331,
"learning_rate": 3.987354123384757e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3116692304611206,
"step": 580,
"valid_targets_mean": 5684.5,
"valid_targets_min": 3490
},
{
"epoch": 0.936,
"grad_norm": 0.5548195739252937,
"learning_rate": 3.9864423833458364e-05,
"loss": 0.3114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3080330789089203,
"step": 585,
"valid_targets_mean": 4697.8,
"valid_targets_min": 1989
},
{
"epoch": 0.944,
"grad_norm": 0.5335506041335158,
"learning_rate": 3.9854990216719285e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2945554554462433,
"step": 590,
"valid_targets_mean": 4857.4,
"valid_targets_min": 2493
},
{
"epoch": 0.952,
"grad_norm": 0.4930115107440699,
"learning_rate": 3.98452405338015e-05,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29840582609176636,
"step": 595,
"valid_targets_mean": 5117.4,
"valid_targets_min": 833
},
{
"epoch": 0.96,
"grad_norm": 0.48996673143333463,
"learning_rate": 3.983517493990756e-05,
"loss": 0.3206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30873602628707886,
"step": 600,
"valid_targets_mean": 5820.4,
"valid_targets_min": 1017
},
{
"epoch": 0.968,
"grad_norm": 0.5283852318337353,
"learning_rate": 3.982479359526892e-05,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3178045153617859,
"step": 605,
"valid_targets_mean": 5300.6,
"valid_targets_min": 1851
},
{
"epoch": 0.976,
"grad_norm": 0.5001051716337229,
"learning_rate": 3.981409666514336e-05,
"loss": 0.3256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31478673219680786,
"step": 610,
"valid_targets_mean": 6632.8,
"valid_targets_min": 2269
},
{
"epoch": 0.984,
"grad_norm": 0.6753756767282909,
"learning_rate": 3.98030843198124e-05,
"loss": 0.3247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31617915630340576,
"step": 615,
"valid_targets_mean": 5035.5,
"valid_targets_min": 768
},
{
"epoch": 0.992,
"grad_norm": 0.5005628037703251,
"learning_rate": 3.979175673457858e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3059810400009155,
"step": 620,
"valid_targets_mean": 5247.0,
"valid_targets_min": 2168
},
{
"epoch": 1.0,
"grad_norm": 0.5101683864070548,
"learning_rate": 3.9780114089762616e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3115279972553253,
"step": 625,
"valid_targets_mean": 6066.2,
"valid_targets_min": 2665
},
{
"epoch": 1.008,
"grad_norm": 0.5061533542766917,
"learning_rate": 3.976815657070062e-05,
"loss": 0.3196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32069745659828186,
"step": 630,
"valid_targets_mean": 5403.9,
"valid_targets_min": 2594
},
{
"epoch": 1.016,
"grad_norm": 0.5059001703699166,
"learning_rate": 3.975588436774107e-05,
"loss": 0.3294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3165131211280823,
"step": 635,
"valid_targets_mean": 6142.6,
"valid_targets_min": 647
},
{
"epoch": 1.024,
"grad_norm": 0.4533978910070391,
"learning_rate": 3.9743297676241826e-05,
"loss": 0.3193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3258289396762848,
"step": 640,
"valid_targets_mean": 6012.1,
"valid_targets_min": 2008
},
{
"epoch": 1.032,
"grad_norm": 0.5083341694516313,
"learning_rate": 3.9730396696566994e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31480103731155396,
"step": 645,
"valid_targets_mean": 6597.6,
"valid_targets_min": 3755
},
{
"epoch": 1.04,
"grad_norm": 0.4935210278014131,
"learning_rate": 3.971718163408375e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2967149019241333,
"step": 650,
"valid_targets_mean": 5684.5,
"valid_targets_min": 708
},
{
"epoch": 1.048,
"grad_norm": 0.565325705266283,
"learning_rate": 3.9703652699159093e-05,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30539369583129883,
"step": 655,
"valid_targets_mean": 4551.8,
"valid_targets_min": 714
},
{
"epoch": 1.056,
"grad_norm": 0.4905273364614086,
"learning_rate": 3.9689810107156425e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29835695028305054,
"step": 660,
"valid_targets_mean": 5777.5,
"valid_targets_min": 2063
},
{
"epoch": 1.064,
"grad_norm": 0.4661058379526559,
"learning_rate": 3.967565407843222e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.276365727186203,
"step": 665,
"valid_targets_mean": 5450.4,
"valid_targets_min": 2204
},
{
"epoch": 1.072,
"grad_norm": 0.5603469801480837,
"learning_rate": 3.966118483833242e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33001142740249634,
"step": 670,
"valid_targets_mean": 6528.9,
"valid_targets_min": 789
},
{
"epoch": 1.08,
"grad_norm": 0.5197535966327156,
"learning_rate": 3.964640261718893e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2953532934188843,
"step": 675,
"valid_targets_mean": 4881.6,
"valid_targets_min": 1040
},
{
"epoch": 1.088,
"grad_norm": 0.4678919417514522,
"learning_rate": 3.963130765031589e-05,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2858159840106964,
"step": 680,
"valid_targets_mean": 5310.2,
"valid_targets_min": 2368
},
{
"epoch": 1.096,
"grad_norm": 0.484112524785576,
"learning_rate": 3.961590017800598e-05,
"loss": 0.314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2966598868370056,
"step": 685,
"valid_targets_mean": 5507.7,
"valid_targets_min": 779
},
{
"epoch": 1.104,
"grad_norm": 0.4984597429065734,
"learning_rate": 3.960018044552653e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29976171255111694,
"step": 690,
"valid_targets_mean": 5569.8,
"valid_targets_min": 2526
},
{
"epoch": 1.112,
"grad_norm": 0.4787188881097212,
"learning_rate": 3.9584148703115704e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30830392241477966,
"step": 695,
"valid_targets_mean": 5337.4,
"valid_targets_min": 2429
},
{
"epoch": 1.12,
"grad_norm": 0.4902996758578751,
"learning_rate": 3.956780520597842e-05,
"loss": 0.307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2992423474788666,
"step": 700,
"valid_targets_mean": 5177.4,
"valid_targets_min": 2765
},
{
"epoch": 1.1280000000000001,
"grad_norm": 0.4774544301602382,
"learning_rate": 3.955115021428236e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31589141488075256,
"step": 705,
"valid_targets_mean": 5750.9,
"valid_targets_min": 2097
},
{
"epoch": 1.1360000000000001,
"grad_norm": 0.4236448807576577,
"learning_rate": 3.95341839931538e-05,
"loss": 0.3056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3106244206428528,
"step": 710,
"valid_targets_mean": 7255.8,
"valid_targets_min": 3054
},
{
"epoch": 1.144,
"grad_norm": 0.4668295458159508,
"learning_rate": 3.95169068126734e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30808717012405396,
"step": 715,
"valid_targets_mean": 6632.2,
"valid_targets_min": 2729
},
{
"epoch": 1.152,
"grad_norm": 0.5435292950469758,
"learning_rate": 3.949931894787187e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3164767920970917,
"step": 720,
"valid_targets_mean": 5680.6,
"valid_targets_min": 2794
},
{
"epoch": 1.16,
"grad_norm": 0.5281852061014428,
"learning_rate": 3.948142067872565e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2959475517272949,
"step": 725,
"valid_targets_mean": 5686.9,
"valid_targets_min": 2968
},
{
"epoch": 1.168,
"grad_norm": 0.4983171972870052,
"learning_rate": 3.946321229015241e-05,
"loss": 0.2993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3173370361328125,
"step": 730,
"valid_targets_mean": 5205.5,
"valid_targets_min": 809
},
{
"epoch": 1.176,
"grad_norm": 0.4890718645725748,
"learning_rate": 3.944469407200652e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3072756230831146,
"step": 735,
"valid_targets_mean": 5731.9,
"valid_targets_min": 2480
},
{
"epoch": 1.184,
"grad_norm": 0.47357704723925165,
"learning_rate": 3.942586631907444e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28427958488464355,
"step": 740,
"valid_targets_mean": 6041.5,
"valid_targets_min": 2130
},
{
"epoch": 1.192,
"grad_norm": 0.5453762286495085,
"learning_rate": 3.9406729331070054e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.295629620552063,
"step": 745,
"valid_targets_mean": 5579.8,
"valid_targets_min": 997
},
{
"epoch": 1.2,
"grad_norm": 0.4852696909448581,
"learning_rate": 3.938728341262985e-05,
"loss": 0.3094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32111233472824097,
"step": 750,
"valid_targets_mean": 5610.9,
"valid_targets_min": 1678
},
{
"epoch": 1.208,
"grad_norm": 0.4935199675479707,
"learning_rate": 3.936752887330812e-05,
"loss": 0.3204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3121909201145172,
"step": 755,
"valid_targets_mean": 5657.9,
"valid_targets_min": 3379
},
{
"epoch": 1.216,
"grad_norm": 0.5449908430487179,
"learning_rate": 3.9347466027571975e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29402291774749756,
"step": 760,
"valid_targets_mean": 5161.4,
"valid_targets_min": 1967
},
{
"epoch": 1.224,
"grad_norm": 0.45633103438298667,
"learning_rate": 3.932709519479639e-05,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34494248032569885,
"step": 765,
"valid_targets_mean": 6849.4,
"valid_targets_min": 4095
},
{
"epoch": 1.232,
"grad_norm": 0.47019749701597285,
"learning_rate": 3.930641669925911e-05,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30092108249664307,
"step": 770,
"valid_targets_mean": 6349.1,
"valid_targets_min": 2875
},
{
"epoch": 1.24,
"grad_norm": 0.5201632699890976,
"learning_rate": 3.928543087013546e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2793954014778137,
"step": 775,
"valid_targets_mean": 4882.1,
"valid_targets_min": 1988
},
{
"epoch": 1.248,
"grad_norm": 0.49981243099331757,
"learning_rate": 3.926413804149315e-05,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2935693860054016,
"step": 780,
"valid_targets_mean": 6399.2,
"valid_targets_min": 1814
},
{
"epoch": 1.256,
"grad_norm": 0.4697792529332793,
"learning_rate": 3.9242538552286894e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31196436285972595,
"step": 785,
"valid_targets_mean": 6547.4,
"valid_targets_min": 659
},
{
"epoch": 1.264,
"grad_norm": 0.5081110490095486,
"learning_rate": 3.9220632746353096e-05,
"loss": 0.3212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34884440898895264,
"step": 790,
"valid_targets_mean": 5839.6,
"valid_targets_min": 2563
},
{
"epoch": 1.272,
"grad_norm": 0.4245750286149305,
"learning_rate": 3.91984209724043e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31733453273773193,
"step": 795,
"valid_targets_mean": 7176.9,
"valid_targets_min": 3404
},
{
"epoch": 1.28,
"grad_norm": 0.4945888003308397,
"learning_rate": 3.917590358402369e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3026392459869385,
"step": 800,
"valid_targets_mean": 5278.9,
"valid_targets_min": 2117
},
{
"epoch": 1.288,
"grad_norm": 0.4743869642323437,
"learning_rate": 3.915308093965943e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2844420075416565,
"step": 805,
"valid_targets_mean": 5709.9,
"valid_targets_min": 2348
},
{
"epoch": 1.296,
"grad_norm": 0.6061193147263803,
"learning_rate": 3.9129953402618976e-05,
"loss": 0.2931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30593141913414,
"step": 810,
"valid_targets_mean": 4334.1,
"valid_targets_min": 766
},
{
"epoch": 1.304,
"grad_norm": 0.4995811617110616,
"learning_rate": 3.91065213410633e-05,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3021504878997803,
"step": 815,
"valid_targets_mean": 5270.4,
"valid_targets_min": 3025
},
{
"epoch": 1.312,
"grad_norm": 0.5677510964504177,
"learning_rate": 3.908278512800098e-05,
"loss": 0.3055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28321537375450134,
"step": 820,
"valid_targets_mean": 5837.6,
"valid_targets_min": 1886
},
{
"epoch": 1.32,
"grad_norm": 0.4806450055573019,
"learning_rate": 3.905874514128235e-05,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.285899817943573,
"step": 825,
"valid_targets_mean": 5459.9,
"valid_targets_min": 2177
},
{
"epoch": 1.328,
"grad_norm": 0.4638341935119887,
"learning_rate": 3.903440176359338e-05,
"loss": 0.2993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2896142303943634,
"step": 830,
"valid_targets_mean": 5199.6,
"valid_targets_min": 2706
},
{
"epoch": 1.336,
"grad_norm": 0.4829925681558631,
"learning_rate": 3.90097553824497e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30030563473701477,
"step": 835,
"valid_targets_mean": 5174.9,
"valid_targets_min": 1798
},
{
"epoch": 1.3439999999999999,
"grad_norm": 0.4540116364686032,
"learning_rate": 3.8984806390190304e-05,
"loss": 0.3087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29696711897850037,
"step": 840,
"valid_targets_mean": 6698.7,
"valid_targets_min": 2721
},
{
"epoch": 1.3519999999999999,
"grad_norm": 0.46848218879375525,
"learning_rate": 3.895955518397141e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.320040225982666,
"step": 845,
"valid_targets_mean": 5730.2,
"valid_targets_min": 607
},
{
"epoch": 1.3599999999999999,
"grad_norm": 0.46627572996018274,
"learning_rate": 3.893400216576011e-05,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2929132878780365,
"step": 850,
"valid_targets_mean": 5770.9,
"valid_targets_min": 784
},
{
"epoch": 1.3679999999999999,
"grad_norm": 0.4997177540619092,
"learning_rate": 3.89081477423279e-05,
"loss": 0.3122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30305910110473633,
"step": 855,
"valid_targets_mean": 5442.1,
"valid_targets_min": 2508
},
{
"epoch": 1.376,
"grad_norm": 0.46782451496329075,
"learning_rate": 3.888199232524434e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27627885341644287,
"step": 860,
"valid_targets_mean": 5929.6,
"valid_targets_min": 2027
},
{
"epoch": 1.384,
"grad_norm": 0.48097129853488274,
"learning_rate": 3.8855536330870354e-05,
"loss": 0.2982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3025239109992981,
"step": 865,
"valid_targets_mean": 6750.7,
"valid_targets_min": 2133
},
{
"epoch": 1.392,
"grad_norm": 0.6100068929323097,
"learning_rate": 3.882878018035173e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3252163827419281,
"step": 870,
"valid_targets_mean": 4455.0,
"valid_targets_min": 1173
},
{
"epoch": 1.4,
"grad_norm": 0.5148159541342916,
"learning_rate": 3.880172429961232e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29258278012275696,
"step": 875,
"valid_targets_mean": 4651.9,
"valid_targets_min": 925
},
{
"epoch": 1.408,
"grad_norm": 0.5381895580511613,
"learning_rate": 3.877436911934733e-05,
"loss": 0.3109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30743107199668884,
"step": 880,
"valid_targets_mean": 5533.6,
"valid_targets_min": 904
},
{
"epoch": 1.416,
"grad_norm": 0.4188291102566486,
"learning_rate": 3.874671507501641e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2865792512893677,
"step": 885,
"valid_targets_mean": 5537.3,
"valid_targets_min": 2931
},
{
"epoch": 1.424,
"grad_norm": 0.4908922548894577,
"learning_rate": 3.871876260683677e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.330981582403183,
"step": 890,
"valid_targets_mean": 5801.6,
"valid_targets_min": 851
},
{
"epoch": 1.432,
"grad_norm": 0.4646370664832961,
"learning_rate": 3.869051215977612e-05,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2849675118923187,
"step": 895,
"valid_targets_mean": 6021.3,
"valid_targets_min": 2230
},
{
"epoch": 1.44,
"grad_norm": 0.48222675658351327,
"learning_rate": 3.8661964183545634e-05,
"loss": 0.2902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672026455402374,
"step": 900,
"valid_targets_mean": 5221.6,
"valid_targets_min": 954
},
{
"epoch": 1.448,
"grad_norm": 0.45000451698113425,
"learning_rate": 3.863311913259276e-05,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2890450656414032,
"step": 905,
"valid_targets_mean": 5694.0,
"valid_targets_min": 1468
},
{
"epoch": 1.456,
"grad_norm": 0.5025170489351635,
"learning_rate": 3.860397746609402e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30842775106430054,
"step": 910,
"valid_targets_mean": 5658.1,
"valid_targets_min": 2233
},
{
"epoch": 1.464,
"grad_norm": 0.49901946092424515,
"learning_rate": 3.857453964794764e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28981584310531616,
"step": 915,
"valid_targets_mean": 4907.5,
"valid_targets_min": 945
},
{
"epoch": 1.472,
"grad_norm": 0.49525172496266556,
"learning_rate": 3.854480614676624e-05,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2704351544380188,
"step": 920,
"valid_targets_mean": 4829.2,
"valid_targets_min": 2224
},
{
"epoch": 1.48,
"grad_norm": 0.4569247307054098,
"learning_rate": 3.851477743586932e-05,
"loss": 0.3053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28220322728157043,
"step": 925,
"valid_targets_mean": 5560.4,
"valid_targets_min": 2442
},
{
"epoch": 1.488,
"grad_norm": 0.4870926051405198,
"learning_rate": 3.8484453993275746e-05,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27977991104125977,
"step": 930,
"valid_targets_mean": 5836.9,
"valid_targets_min": 3443
},
{
"epoch": 1.496,
"grad_norm": 0.48160127940354946,
"learning_rate": 3.8453836301696134e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3110281825065613,
"step": 935,
"valid_targets_mean": 5640.1,
"valid_targets_min": 1980
},
{
"epoch": 1.504,
"grad_norm": 0.48779913431255106,
"learning_rate": 3.842292484852518e-05,
"loss": 0.314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3401919901371002,
"step": 940,
"valid_targets_mean": 5965.8,
"valid_targets_min": 913
},
{
"epoch": 1.512,
"grad_norm": 0.4287904629804472,
"learning_rate": 3.8391720125833875e-05,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.391912579536438,
"step": 945,
"valid_targets_mean": 6960.0,
"valid_targets_min": 613
},
{
"epoch": 1.52,
"grad_norm": 0.45454070436489985,
"learning_rate": 3.83602226303617e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3041311204433441,
"step": 950,
"valid_targets_mean": 6276.3,
"valid_targets_min": 1965
},
{
"epoch": 1.528,
"grad_norm": 0.4367609607515258,
"learning_rate": 3.83284328635087e-05,
"loss": 0.3072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31207773089408875,
"step": 955,
"valid_targets_mean": 6414.3,
"valid_targets_min": 2158
},
{
"epoch": 1.536,
"grad_norm": 0.47628978925952564,
"learning_rate": 3.829635133132751e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3053891658782959,
"step": 960,
"valid_targets_mean": 5082.9,
"valid_targets_min": 2155
},
{
"epoch": 1.544,
"grad_norm": 0.4578863740375709,
"learning_rate": 3.8263978544515304e-05,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29359114170074463,
"step": 965,
"valid_targets_mean": 6367.7,
"valid_targets_min": 3567
},
{
"epoch": 1.552,
"grad_norm": 0.44590971239621957,
"learning_rate": 3.823131501840565e-05,
"loss": 0.2945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28205692768096924,
"step": 970,
"valid_targets_mean": 5617.2,
"valid_targets_min": 2831
},
{
"epoch": 1.56,
"grad_norm": 0.47647296867414674,
"learning_rate": 3.819836127296032e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29584789276123047,
"step": 975,
"valid_targets_mean": 5086.8,
"valid_targets_min": 2383
},
{
"epoch": 1.568,
"grad_norm": 0.44827088421612804,
"learning_rate": 3.8165117832761016e-05,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2906496524810791,
"step": 980,
"valid_targets_mean": 5322.4,
"valid_targets_min": 925
},
{
"epoch": 1.576,
"grad_norm": 0.46473511615349966,
"learning_rate": 3.813158522700098e-05,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3010580837726593,
"step": 985,
"valid_targets_mean": 6231.4,
"valid_targets_min": 2747
},
{
"epoch": 1.584,
"grad_norm": 0.46146412830588385,
"learning_rate": 3.809776398947665e-05,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2865464389324188,
"step": 990,
"valid_targets_mean": 5287.1,
"valid_targets_min": 2584
},
{
"epoch": 1.592,
"grad_norm": 0.41928387386535865,
"learning_rate": 3.806365465857908e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2612549960613251,
"step": 995,
"valid_targets_mean": 6553.7,
"valid_targets_min": 2261
},
{
"epoch": 1.6,
"grad_norm": 0.4446606668239555,
"learning_rate": 3.802925777728541e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29210934042930603,
"step": 1000,
"valid_targets_mean": 5958.9,
"valid_targets_min": 2292
},
{
"epoch": 1.608,
"grad_norm": 0.4596824212829141,
"learning_rate": 3.799457389315023e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2969397306442261,
"step": 1005,
"valid_targets_mean": 5465.1,
"valid_targets_min": 2633
},
{
"epoch": 1.616,
"grad_norm": 0.4642174072728452,
"learning_rate": 3.795960355829683e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3383893370628357,
"step": 1010,
"valid_targets_mean": 5533.6,
"valid_targets_min": 1543
},
{
"epoch": 1.624,
"grad_norm": 0.41923015410914755,
"learning_rate": 3.7924347329408444e-05,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2893693447113037,
"step": 1015,
"valid_targets_mean": 6553.8,
"valid_targets_min": 2738
},
{
"epoch": 1.6320000000000001,
"grad_norm": 0.474798883715657,
"learning_rate": 3.788880576771937e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3074151873588562,
"step": 1020,
"valid_targets_mean": 5287.8,
"valid_targets_min": 920
},
{
"epoch": 1.6400000000000001,
"grad_norm": 0.4859351138274312,
"learning_rate": 3.785297943900605e-05,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2984621822834015,
"step": 1025,
"valid_targets_mean": 4972.1,
"valid_targets_min": 3064
},
{
"epoch": 1.6480000000000001,
"grad_norm": 0.45439722658451603,
"learning_rate": 3.7816868913578044e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29881051182746887,
"step": 1030,
"valid_targets_mean": 6891.9,
"valid_targets_min": 797
},
{
"epoch": 1.6560000000000001,
"grad_norm": 0.4954789496970954,
"learning_rate": 3.778047476626897e-05,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27837109565734863,
"step": 1035,
"valid_targets_mean": 4826.8,
"valid_targets_min": 2124
},
{
"epoch": 1.6640000000000001,
"grad_norm": 0.4486524659460757,
"learning_rate": 3.7743797576427335e-05,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2992919683456421,
"step": 1040,
"valid_targets_mean": 5997.5,
"valid_targets_min": 1923
},
{
"epoch": 1.6720000000000002,
"grad_norm": 0.4744725016895598,
"learning_rate": 3.770683792790733e-05,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35754770040512085,
"step": 1045,
"valid_targets_mean": 5574.3,
"valid_targets_min": 2306
},
{
"epoch": 1.6800000000000002,
"grad_norm": 0.4619485199478231,
"learning_rate": 3.766959640905954e-05,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26582252979278564,
"step": 1050,
"valid_targets_mean": 4876.6,
"valid_targets_min": 2432
},
{
"epoch": 1.688,
"grad_norm": 0.46452806236395455,
"learning_rate": 3.763207361272153e-05,
"loss": 0.2832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2735568583011627,
"step": 1055,
"valid_targets_mean": 4596.1,
"valid_targets_min": 862
},
{
"epoch": 1.696,
"grad_norm": 0.4613970271174457,
"learning_rate": 3.759427013620849e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30159851908683777,
"step": 1060,
"valid_targets_mean": 5337.3,
"valid_targets_min": 2797
},
{
"epoch": 1.704,
"grad_norm": 0.45254038624818077,
"learning_rate": 3.755618658130366e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.332949697971344,
"step": 1065,
"valid_targets_mean": 6322.7,
"valid_targets_min": 2395
},
{
"epoch": 1.712,
"grad_norm": 0.46132268024374845,
"learning_rate": 3.751782355424877e-05,
"loss": 0.3057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3081086277961731,
"step": 1070,
"valid_targets_mean": 5333.1,
"valid_targets_min": 676
},
{
"epoch": 1.72,
"grad_norm": 0.647810915100628,
"learning_rate": 3.7479181665734395e-05,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2798285484313965,
"step": 1075,
"valid_targets_mean": 4865.9,
"valid_targets_min": 768
},
{
"epoch": 1.728,
"grad_norm": 0.4595256488279494,
"learning_rate": 3.7440261530890213e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30216994881629944,
"step": 1080,
"valid_targets_mean": 5566.8,
"valid_targets_min": 3165
},
{
"epoch": 1.736,
"grad_norm": 0.5173055386818666,
"learning_rate": 3.740106376927527e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26667511463165283,
"step": 1085,
"valid_targets_mean": 4258.4,
"valid_targets_min": 2453
},
{
"epoch": 1.744,
"grad_norm": 0.44729287065917317,
"learning_rate": 3.7361589004868035e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29991859197616577,
"step": 1090,
"valid_targets_mean": 5005.5,
"valid_targets_min": 1317
},
{
"epoch": 1.752,
"grad_norm": 0.4502413369795436,
"learning_rate": 3.7321837866056535e-05,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.311065137386322,
"step": 1095,
"valid_targets_mean": 5624.9,
"valid_targets_min": 2808
},
{
"epoch": 1.76,
"grad_norm": 0.44388049018525816,
"learning_rate": 3.728181098562831e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32409796118736267,
"step": 1100,
"valid_targets_mean": 5841.8,
"valid_targets_min": 742
},
{
"epoch": 1.768,
"grad_norm": 0.4946267811455118,
"learning_rate": 3.7241509000760355e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3057519793510437,
"step": 1105,
"valid_targets_mean": 5293.1,
"valid_targets_min": 2960
},
{
"epoch": 1.776,
"grad_norm": 0.48440289350790505,
"learning_rate": 3.720093255300899e-05,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29010993242263794,
"step": 1110,
"valid_targets_mean": 5239.8,
"valid_targets_min": 1797
},
{
"epoch": 1.784,
"grad_norm": 0.42075171272953676,
"learning_rate": 3.7160082288299645e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29798623919487,
"step": 1115,
"valid_targets_mean": 5845.2,
"valid_targets_min": 2606
},
{
"epoch": 1.792,
"grad_norm": 0.44876314392122135,
"learning_rate": 3.7118958856916534e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.317965030670166,
"step": 1120,
"valid_targets_mean": 5691.3,
"valid_targets_min": 729
},
{
"epoch": 1.8,
"grad_norm": 0.4562553068597693,
"learning_rate": 3.707756291349237e-05,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3572045564651489,
"step": 1125,
"valid_targets_mean": 6273.2,
"valid_targets_min": 3036
},
{
"epoch": 1.808,
"grad_norm": 0.4654698361735082,
"learning_rate": 3.703589511699787e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2775658369064331,
"step": 1130,
"valid_targets_mean": 5154.9,
"valid_targets_min": 1883
},
{
"epoch": 1.8159999999999998,
"grad_norm": 0.4585691012158252,
"learning_rate": 3.6993956130731355e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2992740571498871,
"step": 1135,
"valid_targets_mean": 5435.6,
"valid_targets_min": 2525
},
{
"epoch": 1.8239999999999998,
"grad_norm": 0.423001138385012,
"learning_rate": 3.6951746622308106e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28858619928359985,
"step": 1140,
"valid_targets_mean": 5687.1,
"valid_targets_min": 926
},
{
"epoch": 1.8319999999999999,
"grad_norm": 0.43450074990970605,
"learning_rate": 3.69092672636498e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3227563500404358,
"step": 1145,
"valid_targets_mean": 7171.9,
"valid_targets_min": 4053
},
{
"epoch": 1.8399999999999999,
"grad_norm": 0.45663335612023054,
"learning_rate": 3.686651873097375e-05,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3199521601200104,
"step": 1150,
"valid_targets_mean": 6205.1,
"valid_targets_min": 1888
},
{
"epoch": 1.8479999999999999,
"grad_norm": 0.40345881129581174,
"learning_rate": 3.682350170478223e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2745388150215149,
"step": 1155,
"valid_targets_mean": 6815.2,
"valid_targets_min": 2696
},
{
"epoch": 1.8559999999999999,
"grad_norm": 0.4739803045161771,
"learning_rate": 3.678021686985153e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3329041302204132,
"step": 1160,
"valid_targets_mean": 6181.8,
"valid_targets_min": 2589
},
{
"epoch": 1.8639999999999999,
"grad_norm": 0.4119410013072989,
"learning_rate": 3.6736664915221144e-05,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29115116596221924,
"step": 1165,
"valid_targets_mean": 6576.3,
"valid_targets_min": 965
},
{
"epoch": 1.8719999999999999,
"grad_norm": 0.4383779875712353,
"learning_rate": 3.669284653418278e-05,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30039533972740173,
"step": 1170,
"valid_targets_mean": 6318.1,
"valid_targets_min": 3353
},
{
"epoch": 1.88,
"grad_norm": 0.4478554027571998,
"learning_rate": 3.6648762424269306e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2735443115234375,
"step": 1175,
"valid_targets_mean": 5188.6,
"valid_targets_min": 2463
},
{
"epoch": 1.888,
"grad_norm": 0.4967663577542887,
"learning_rate": 3.660441328724365e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2868739366531372,
"step": 1180,
"valid_targets_mean": 6199.9,
"valid_targets_min": 2365
},
{
"epoch": 1.896,
"grad_norm": 0.4544842757439779,
"learning_rate": 3.655979982908764e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2722131609916687,
"step": 1185,
"valid_targets_mean": 4829.0,
"valid_targets_min": 1607
},
{
"epoch": 1.904,
"grad_norm": 0.4312917127023269,
"learning_rate": 3.6514922759990756e-05,
"loss": 0.2871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30703186988830566,
"step": 1190,
"valid_targets_mean": 5894.9,
"valid_targets_min": 2382
},
{
"epoch": 1.912,
"grad_norm": 0.4773885555314306,
"learning_rate": 3.646978279433883e-05,
"loss": 0.2924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.275803804397583,
"step": 1195,
"valid_targets_mean": 5051.6,
"valid_targets_min": 2287
},
{
"epoch": 1.92,
"grad_norm": 0.4441897580352912,
"learning_rate": 3.6424380650702685e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2826846241950989,
"step": 1200,
"valid_targets_mean": 5370.1,
"valid_targets_min": 1760
},
{
"epoch": 1.928,
"grad_norm": 0.4612436316301898,
"learning_rate": 3.637871705182667e-05,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2725675702095032,
"step": 1205,
"valid_targets_mean": 4786.4,
"valid_targets_min": 2658
},
{
"epoch": 1.936,
"grad_norm": 0.5513342663258486,
"learning_rate": 3.633279272461717e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3400229513645172,
"step": 1210,
"valid_targets_mean": 5965.6,
"valid_targets_min": 833
},
{
"epoch": 1.944,
"grad_norm": 0.4419992875343551,
"learning_rate": 3.628660840013102e-05,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2913501262664795,
"step": 1215,
"valid_targets_mean": 5585.3,
"valid_targets_min": 2383
},
{
"epoch": 1.952,
"grad_norm": 0.4328857845662596,
"learning_rate": 3.624016481356392e-05,
"loss": 0.2881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29528385400772095,
"step": 1220,
"valid_targets_mean": 5912.7,
"valid_targets_min": 3592
},
{
"epoch": 1.96,
"grad_norm": 0.4729340584130962,
"learning_rate": 3.619346270423866e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3194947838783264,
"step": 1225,
"valid_targets_mean": 5515.3,
"valid_targets_min": 2746
},
{
"epoch": 1.968,
"grad_norm": 0.42437072854473223,
"learning_rate": 3.6146502815593384e-05,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2815873622894287,
"step": 1230,
"valid_targets_mean": 5601.3,
"valid_targets_min": 2488
},
{
"epoch": 1.976,
"grad_norm": 0.41289542578032434,
"learning_rate": 3.609928589516977e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2931348979473114,
"step": 1235,
"valid_targets_mean": 6282.1,
"valid_targets_min": 863
},
{
"epoch": 1.984,
"grad_norm": 0.5321386208096575,
"learning_rate": 3.6051812694601114e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28520435094833374,
"step": 1240,
"valid_targets_mean": 6663.6,
"valid_targets_min": 2058
},
{
"epoch": 1.992,
"grad_norm": 0.482697618696399,
"learning_rate": 3.6004083969600346e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2983943223953247,
"step": 1245,
"valid_targets_mean": 4540.4,
"valid_targets_min": 834
},
{
"epoch": 2.0,
"grad_norm": 0.49192629172974606,
"learning_rate": 3.595610047994804e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2858894169330597,
"step": 1250,
"valid_targets_mean": 5028.2,
"valid_targets_min": 1660
},
{
"epoch": 2.008,
"grad_norm": 0.4359872718221418,
"learning_rate": 3.5907862989480285e-05,
"loss": 0.2748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2697839140892029,
"step": 1255,
"valid_targets_mean": 7249.1,
"valid_targets_min": 2496
},
{
"epoch": 2.016,
"grad_norm": 0.45859795145980614,
"learning_rate": 3.585937226607656e-05,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.279720664024353,
"step": 1260,
"valid_targets_mean": 5313.3,
"valid_targets_min": 2647
},
{
"epoch": 2.024,
"grad_norm": 0.4505438704272417,
"learning_rate": 3.5810629081647476e-05,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2788507044315338,
"step": 1265,
"valid_targets_mean": 6312.9,
"valid_targets_min": 2771
},
{
"epoch": 2.032,
"grad_norm": 0.4691711148608988,
"learning_rate": 3.576163421212249e-05,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2736594080924988,
"step": 1270,
"valid_targets_mean": 4661.1,
"valid_targets_min": 578
},
{
"epoch": 2.04,
"grad_norm": 0.5037167340395163,
"learning_rate": 3.5712388437437576e-05,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2533131241798401,
"step": 1275,
"valid_targets_mean": 5276.2,
"valid_targets_min": 3433
},
{
"epoch": 2.048,
"grad_norm": 0.42546930787191156,
"learning_rate": 3.566289254152283e-05,
"loss": 0.2784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2628275752067566,
"step": 1280,
"valid_targets_mean": 6090.3,
"valid_targets_min": 3340
},
{
"epoch": 2.056,
"grad_norm": 0.42930908716917526,
"learning_rate": 3.56131473122899e-05,
"loss": 0.2816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27324312925338745,
"step": 1285,
"valid_targets_mean": 5684.6,
"valid_targets_min": 766
},
{
"epoch": 2.064,
"grad_norm": 0.49385851729689484,
"learning_rate": 3.556315354161955e-05,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26746314764022827,
"step": 1290,
"valid_targets_mean": 5008.8,
"valid_targets_min": 2139
},
{
"epoch": 2.072,
"grad_norm": 0.4391947070222829,
"learning_rate": 3.551291202534899e-05,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27265650033950806,
"step": 1295,
"valid_targets_mean": 5607.2,
"valid_targets_min": 2190
},
{
"epoch": 2.08,
"grad_norm": 0.4582254368398922,
"learning_rate": 3.546242356325922e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2865563631057739,
"step": 1300,
"valid_targets_mean": 5633.8,
"valid_targets_min": 687
},
{
"epoch": 2.088,
"grad_norm": 0.4293498674993555,
"learning_rate": 3.5411688959062323e-05,
"loss": 0.2797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2655894458293915,
"step": 1305,
"valid_targets_mean": 5344.7,
"valid_targets_min": 2540
},
{
"epoch": 2.096,
"grad_norm": 0.4332699663002504,
"learning_rate": 3.5360709020388625e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2839583158493042,
"step": 1310,
"valid_targets_mean": 6193.4,
"valid_targets_min": 2130
},
{
"epoch": 2.104,
"grad_norm": 0.4796757683247767,
"learning_rate": 3.530948455877388e-05,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2717803120613098,
"step": 1315,
"valid_targets_mean": 5138.0,
"valid_targets_min": 2010
},
{
"epoch": 2.112,
"grad_norm": 0.474723248917543,
"learning_rate": 3.525801638964634e-05,
"loss": 0.2862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3030173182487488,
"step": 1320,
"valid_targets_mean": 5644.9,
"valid_targets_min": 1939
},
{
"epoch": 2.12,
"grad_norm": 0.41894104802521787,
"learning_rate": 3.520630533231376e-05,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30031317472457886,
"step": 1325,
"valid_targets_mean": 6236.9,
"valid_targets_min": 2499
},
{
"epoch": 2.128,
"grad_norm": 0.44950239662521674,
"learning_rate": 3.5154352209950376e-05,
"loss": 0.2759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29977887868881226,
"step": 1330,
"valid_targets_mean": 6185.9,
"valid_targets_min": 2168
},
{
"epoch": 2.136,
"grad_norm": 0.43075680464817284,
"learning_rate": 3.510215784958376e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25842052698135376,
"step": 1335,
"valid_targets_mean": 5626.4,
"valid_targets_min": 2212
},
{
"epoch": 2.144,
"grad_norm": 0.4015925556150186,
"learning_rate": 3.5049723082081755e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2656909227371216,
"step": 1340,
"valid_targets_mean": 7547.5,
"valid_targets_min": 4034
},
{
"epoch": 2.152,
"grad_norm": 0.43393949690284467,
"learning_rate": 3.49970487421391e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3003223240375519,
"step": 1345,
"valid_targets_mean": 6083.6,
"valid_targets_min": 1981
},
{
"epoch": 2.16,
"grad_norm": 0.43827694971056175,
"learning_rate": 3.494413566826427e-05,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26340213418006897,
"step": 1350,
"valid_targets_mean": 6010.8,
"valid_targets_min": 1962
},
{
"epoch": 2.168,
"grad_norm": 0.40727563091955427,
"learning_rate": 3.489098470276608e-05,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2752530574798584,
"step": 1355,
"valid_targets_mean": 6446.7,
"valid_targets_min": 2515
},
{
"epoch": 2.176,
"grad_norm": 0.4075018940370257,
"learning_rate": 3.483759669174024e-05,
"loss": 0.2759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2670140266418457,
"step": 1360,
"valid_targets_mean": 6044.2,
"valid_targets_min": 2033
},
{
"epoch": 2.184,
"grad_norm": 0.4458150382743038,
"learning_rate": 3.478397248505598e-05,
"loss": 0.2777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28183412551879883,
"step": 1365,
"valid_targets_mean": 5179.1,
"valid_targets_min": 2292
},
{
"epoch": 2.192,
"grad_norm": 0.441118210464986,
"learning_rate": 3.473011293634241e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2754057049751282,
"step": 1370,
"valid_targets_mean": 5369.0,
"valid_targets_min": 582
},
{
"epoch": 2.2,
"grad_norm": 0.4614185627987562,
"learning_rate": 3.467601890297502e-05,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30023840069770813,
"step": 1375,
"valid_targets_mean": 6044.8,
"valid_targets_min": 2461
},
{
"epoch": 2.208,
"grad_norm": 0.4493461757147211,
"learning_rate": 3.4621691246061976e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2876693606376648,
"step": 1380,
"valid_targets_mean": 6722.2,
"valid_targets_min": 2520
},
{
"epoch": 2.216,
"grad_norm": 0.5466147214995866,
"learning_rate": 3.456713083043046e-05,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2818297743797302,
"step": 1385,
"valid_targets_mean": 6499.2,
"valid_targets_min": 2419
},
{
"epoch": 2.224,
"grad_norm": 0.41989719260316044,
"learning_rate": 3.451233852461285e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30823421478271484,
"step": 1390,
"valid_targets_mean": 6820.2,
"valid_targets_min": 3289
},
{
"epoch": 2.232,
"grad_norm": 0.43771545385689653,
"learning_rate": 3.4457315200832935e-05,
"loss": 0.2816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2757190465927124,
"step": 1395,
"valid_targets_mean": 5641.8,
"valid_targets_min": 2220
},
{
"epoch": 2.24,
"grad_norm": 0.4799367692033165,
"learning_rate": 3.440206173499201e-05,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28247034549713135,
"step": 1400,
"valid_targets_mean": 5592.2,
"valid_targets_min": 3292
},
{
"epoch": 2.248,
"grad_norm": 0.43043323612593953,
"learning_rate": 3.4346579006654945e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2743549048900604,
"step": 1405,
"valid_targets_mean": 5858.2,
"valid_targets_min": 2022
},
{
"epoch": 2.2560000000000002,
"grad_norm": 0.4205959013545583,
"learning_rate": 3.4290867899036166e-05,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30858612060546875,
"step": 1410,
"valid_targets_mean": 6465.2,
"valid_targets_min": 3118
},
{
"epoch": 2.2640000000000002,
"grad_norm": 0.3702037241290151,
"learning_rate": 3.4234929298985614e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27199870347976685,
"step": 1415,
"valid_targets_mean": 6840.3,
"valid_targets_min": 3274
},
{
"epoch": 2.2720000000000002,
"grad_norm": 0.49042099459027266,
"learning_rate": 3.417876409697463e-05,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2543753981590271,
"step": 1420,
"valid_targets_mean": 4505.9,
"valid_targets_min": 627
},
{
"epoch": 2.2800000000000002,
"grad_norm": 0.4676067529924004,
"learning_rate": 3.412237318708175e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3017064929008484,
"step": 1425,
"valid_targets_mean": 5715.6,
"valid_targets_min": 2442
},
{
"epoch": 2.288,
"grad_norm": 0.44794340952190315,
"learning_rate": 3.4065757466978504e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2632843852043152,
"step": 1430,
"valid_targets_mean": 5181.3,
"valid_targets_min": 737
},
{
"epoch": 2.296,
"grad_norm": 0.4515048985651608,
"learning_rate": 3.400891783791511e-05,
"loss": 0.2746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26894891262054443,
"step": 1435,
"valid_targets_mean": 5134.5,
"valid_targets_min": 2738
},
{
"epoch": 2.304,
"grad_norm": 0.4210263389946454,
"learning_rate": 3.395185520470614e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2625139355659485,
"step": 1440,
"valid_targets_mean": 5573.9,
"valid_targets_min": 2412
},
{
"epoch": 2.312,
"grad_norm": 0.45646353517684174,
"learning_rate": 3.38945704757161e-05,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29955101013183594,
"step": 1445,
"valid_targets_mean": 4880.6,
"valid_targets_min": 2246
},
{
"epoch": 2.32,
"grad_norm": 0.4648922907575776,
"learning_rate": 3.383706456284498e-05,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535097897052765,
"step": 1450,
"valid_targets_mean": 4900.8,
"valid_targets_min": 2258
},
{
"epoch": 2.328,
"grad_norm": 0.414919522096783,
"learning_rate": 3.377933838151374e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27614641189575195,
"step": 1455,
"valid_targets_mean": 5782.2,
"valid_targets_min": 2233
},
{
"epoch": 2.336,
"grad_norm": 0.4721401237719625,
"learning_rate": 3.3721392850649714e-05,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.279009073972702,
"step": 1460,
"valid_targets_mean": 5091.2,
"valid_targets_min": 2956
},
{
"epoch": 2.344,
"grad_norm": 0.3980236596511246,
"learning_rate": 3.3663228892672034e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30130547285079956,
"step": 1465,
"valid_targets_mean": 6822.2,
"valid_targets_min": 1767
},
{
"epoch": 2.352,
"grad_norm": 0.4411737648188492,
"learning_rate": 3.36048474334769e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28683120012283325,
"step": 1470,
"valid_targets_mean": 5142.1,
"valid_targets_min": 921
},
{
"epoch": 2.36,
"grad_norm": 0.40418223383565033,
"learning_rate": 3.3546249402422834e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27696824073791504,
"step": 1475,
"valid_targets_mean": 6867.9,
"valid_targets_min": 2408
},
{
"epoch": 2.368,
"grad_norm": 0.4328314194872318,
"learning_rate": 3.3487435732315944e-05,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26666712760925293,
"step": 1480,
"valid_targets_mean": 5044.9,
"valid_targets_min": 1312
},
{
"epoch": 2.376,
"grad_norm": 0.4188243659370168,
"learning_rate": 3.342840735939501e-05,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27887147665023804,
"step": 1485,
"valid_targets_mean": 6185.2,
"valid_targets_min": 3188
},
{
"epoch": 2.384,
"grad_norm": 0.4525280463154427,
"learning_rate": 3.33691652233166e-05,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2639387249946594,
"step": 1490,
"valid_targets_mean": 5238.1,
"valid_targets_min": 2297
},
{
"epoch": 2.392,
"grad_norm": 0.40754755046085145,
"learning_rate": 3.330971026714016e-05,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27780595421791077,
"step": 1495,
"valid_targets_mean": 5899.4,
"valid_targets_min": 961
},
{
"epoch": 2.4,
"grad_norm": 0.45449778937356167,
"learning_rate": 3.325004343731292e-05,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2731771469116211,
"step": 1500,
"valid_targets_mean": 5282.1,
"valid_targets_min": 2451
},
{
"epoch": 2.408,
"grad_norm": 0.41936217467238024,
"learning_rate": 3.3190165683654885e-05,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2833578586578369,
"step": 1505,
"valid_targets_mean": 5853.5,
"valid_targets_min": 2398
},
{
"epoch": 2.416,
"grad_norm": 0.47309565281866045,
"learning_rate": 3.31300779593437e-05,
"loss": 0.2729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2796747386455536,
"step": 1510,
"valid_targets_mean": 5078.4,
"valid_targets_min": 1543
},
{
"epoch": 2.424,
"grad_norm": 0.4177225202562232,
"learning_rate": 3.306978122089948e-05,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24066470563411713,
"step": 1515,
"valid_targets_mean": 5414.7,
"valid_targets_min": 2838
},
{
"epoch": 2.432,
"grad_norm": 0.39007343307685954,
"learning_rate": 3.300927642816957e-05,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2647990882396698,
"step": 1520,
"valid_targets_mean": 7182.4,
"valid_targets_min": 3833
},
{
"epoch": 2.44,
"grad_norm": 0.4766268290914442,
"learning_rate": 3.294856454431328e-05,
"loss": 0.2731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2947763502597809,
"step": 1525,
"valid_targets_mean": 5058.1,
"valid_targets_min": 740
},
{
"epoch": 2.448,
"grad_norm": 0.4749676704997854,
"learning_rate": 3.288764653578653e-05,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2593019902706146,
"step": 1530,
"valid_targets_mean": 5531.9,
"valid_targets_min": 3211
},
{
"epoch": 2.456,
"grad_norm": 0.43087832321512626,
"learning_rate": 3.2826523372326516e-05,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2759775221347809,
"step": 1535,
"valid_targets_mean": 5525.2,
"valid_targets_min": 2348
},
{
"epoch": 2.464,
"grad_norm": 0.4144418282536644,
"learning_rate": 3.276519602693621e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2653999924659729,
"step": 1540,
"valid_targets_mean": 5352.9,
"valid_targets_min": 542
},
{
"epoch": 2.472,
"grad_norm": 0.42435435381093956,
"learning_rate": 3.270366547586892e-05,
"loss": 0.2794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2846945524215698,
"step": 1545,
"valid_targets_mean": 5556.9,
"valid_targets_min": 2818
},
{
"epoch": 2.48,
"grad_norm": 0.46730653220343593,
"learning_rate": 3.2641932698612715e-05,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27474409341812134,
"step": 1550,
"valid_targets_mean": 4989.6,
"valid_targets_min": 3049
},
{
"epoch": 2.488,
"grad_norm": 0.4484239721050301,
"learning_rate": 3.2579998677874855e-05,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2688925862312317,
"step": 1555,
"valid_targets_mean": 5152.9,
"valid_targets_min": 744
},
{
"epoch": 2.496,
"grad_norm": 0.45786906944884076,
"learning_rate": 3.251786439956614e-05,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26745644211769104,
"step": 1560,
"valid_targets_mean": 4496.0,
"valid_targets_min": 834
},
{
"epoch": 2.504,
"grad_norm": 0.5706239065761335,
"learning_rate": 3.2455530852785206e-05,
"loss": 0.2745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29573023319244385,
"step": 1565,
"valid_targets_mean": 3546.1,
"valid_targets_min": 536
},
{
"epoch": 2.512,
"grad_norm": 0.4660476242711952,
"learning_rate": 3.239299902980281e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2543278634548187,
"step": 1570,
"valid_targets_mean": 4862.9,
"valid_targets_min": 2734
},
{
"epoch": 2.52,
"grad_norm": 0.42408248225968304,
"learning_rate": 3.2330269926046e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2651727795600891,
"step": 1575,
"valid_targets_mean": 5785.1,
"valid_targets_min": 1938
},
{
"epoch": 2.528,
"grad_norm": 0.4129023020912163,
"learning_rate": 3.2267344540082284e-05,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28441861271858215,
"step": 1580,
"valid_targets_mean": 5624.2,
"valid_targets_min": 1104
},
{
"epoch": 2.536,
"grad_norm": 0.41229447790684026,
"learning_rate": 3.220422387360373e-05,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2966400980949402,
"step": 1585,
"valid_targets_mean": 6064.5,
"valid_targets_min": 711
},
{
"epoch": 2.544,
"grad_norm": 0.3940473278014604,
"learning_rate": 3.2140908931411026e-05,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2629774510860443,
"step": 1590,
"valid_targets_mean": 6014.9,
"valid_targets_min": 2710
},
{
"epoch": 2.552,
"grad_norm": 0.48235415015990013,
"learning_rate": 3.207740072139748e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27599039673805237,
"step": 1595,
"valid_targets_mean": 4336.2,
"valid_targets_min": 676
},
{
"epoch": 2.56,
"grad_norm": 0.43812989181014855,
"learning_rate": 3.2013700254532996e-05,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2840218245983124,
"step": 1600,
"valid_targets_mean": 6128.1,
"valid_targets_min": 2306
},
{
"epoch": 2.568,
"grad_norm": 0.4421391095546585,
"learning_rate": 3.194980854484794e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2730617821216583,
"step": 1605,
"valid_targets_mean": 5236.0,
"valid_targets_min": 2238
},
{
"epoch": 2.576,
"grad_norm": 0.40993966192632497,
"learning_rate": 3.188572660941702e-05,
"loss": 0.2737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2702597379684448,
"step": 1610,
"valid_targets_mean": 5520.4,
"valid_targets_min": 1951
},
{
"epoch": 2.584,
"grad_norm": 0.449106850254283,
"learning_rate": 3.182145546834311e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2685029208660126,
"step": 1615,
"valid_targets_mean": 5474.4,
"valid_targets_min": 1011
},
{
"epoch": 2.592,
"grad_norm": 0.43609694783076547,
"learning_rate": 3.1756996144740994e-05,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26621997356414795,
"step": 1620,
"valid_targets_mean": 5704.4,
"valid_targets_min": 2305
},
{
"epoch": 2.6,
"grad_norm": 0.437600515095227,
"learning_rate": 3.1692349664721074e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2866860032081604,
"step": 1625,
"valid_targets_mean": 6387.4,
"valid_targets_min": 2588
},
{
"epoch": 2.608,
"grad_norm": 0.4758070327306289,
"learning_rate": 3.1627517057373046e-05,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27016139030456543,
"step": 1630,
"valid_targets_mean": 5040.3,
"valid_targets_min": 804
},
{
"epoch": 2.616,
"grad_norm": 0.5050945646090564,
"learning_rate": 3.156249935474953e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27052950859069824,
"step": 1635,
"valid_targets_mean": 5326.6,
"valid_targets_min": 2368
},
{
"epoch": 2.624,
"grad_norm": 0.39592620562061526,
"learning_rate": 3.1497297591849614e-05,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26756832003593445,
"step": 1640,
"valid_targets_mean": 6438.1,
"valid_targets_min": 970
},
{
"epoch": 2.632,
"grad_norm": 0.47399414052636385,
"learning_rate": 3.143191280660238e-05,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3013014495372772,
"step": 1645,
"valid_targets_mean": 5066.2,
"valid_targets_min": 2808
},
{
"epoch": 2.64,
"grad_norm": 0.4498456912539592,
"learning_rate": 3.1366346039850424e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3045828938484192,
"step": 1650,
"valid_targets_mean": 5521.9,
"valid_targets_min": 585
},
{
"epoch": 2.648,
"grad_norm": 0.495309465433173,
"learning_rate": 3.130059833533323e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30020833015441895,
"step": 1655,
"valid_targets_mean": 4797.9,
"valid_targets_min": 564
},
{
"epoch": 2.656,
"grad_norm": 0.4297894353894199,
"learning_rate": 3.123467073967059e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2691328823566437,
"step": 1660,
"valid_targets_mean": 6277.9,
"valid_targets_min": 3682
},
{
"epoch": 2.664,
"grad_norm": 0.45151420932528674,
"learning_rate": 3.116856430234594e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2929932773113251,
"step": 1665,
"valid_targets_mean": 6091.2,
"valid_targets_min": 1280
},
{
"epoch": 2.672,
"grad_norm": 0.4255273252520274,
"learning_rate": 3.110228007568963e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2611987590789795,
"step": 1670,
"valid_targets_mean": 5407.6,
"valid_targets_min": 2936
},
{
"epoch": 2.68,
"grad_norm": 0.41326123258834,
"learning_rate": 3.103581911486221e-05,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2713870704174042,
"step": 1675,
"valid_targets_mean": 5890.7,
"valid_targets_min": 3319
},
{
"epoch": 2.6879999999999997,
"grad_norm": 0.42906521181729274,
"learning_rate": 3.0969182477837604e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2987547516822815,
"step": 1680,
"valid_targets_mean": 6719.4,
"valid_targets_min": 797
},
{
"epoch": 2.6959999999999997,
"grad_norm": 0.4651035568357889,
"learning_rate": 3.090237122538628e-05,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2748391032218933,
"step": 1685,
"valid_targets_mean": 4811.9,
"valid_targets_min": 1835
},
{
"epoch": 2.7039999999999997,
"grad_norm": 0.4526858770407024,
"learning_rate": 3.0835386421058345e-05,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2757079303264618,
"step": 1690,
"valid_targets_mean": 5114.1,
"valid_targets_min": 1825
},
{
"epoch": 2.7119999999999997,
"grad_norm": 0.4303883323426744,
"learning_rate": 3.0768229131166664e-05,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27044957876205444,
"step": 1695,
"valid_targets_mean": 5952.2,
"valid_targets_min": 2348
},
{
"epoch": 2.7199999999999998,
"grad_norm": 0.421293283882041,
"learning_rate": 3.070090042476983e-05,
"loss": 0.2794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2537495195865631,
"step": 1700,
"valid_targets_mean": 5275.4,
"valid_targets_min": 2820
},
{
"epoch": 2.7279999999999998,
"grad_norm": 0.42070620075383014,
"learning_rate": 3.063340137365517e-05,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26784974336624146,
"step": 1705,
"valid_targets_mean": 6155.7,
"valid_targets_min": 2833
},
{
"epoch": 2.7359999999999998,
"grad_norm": 0.46160330069058947,
"learning_rate": 3.0565733052321674e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3010793924331665,
"step": 1710,
"valid_targets_mean": 5182.6,
"valid_targets_min": 766
},
{
"epoch": 2.7439999999999998,
"grad_norm": 0.47565115114958284,
"learning_rate": 3.0497896537962924e-05,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29553931951522827,
"step": 1715,
"valid_targets_mean": 4856.3,
"valid_targets_min": 2348
},
{
"epoch": 2.752,
"grad_norm": 0.47758063053303274,
"learning_rate": 3.042989291044991e-05,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2923269271850586,
"step": 1720,
"valid_targets_mean": 4834.2,
"valid_targets_min": 604
},
{
"epoch": 2.76,
"grad_norm": 0.44821402221279694,
"learning_rate": 3.036172325231383e-05,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27335962653160095,
"step": 1725,
"valid_targets_mean": 5101.4,
"valid_targets_min": 2237
},
{
"epoch": 2.768,
"grad_norm": 0.40899132950092204,
"learning_rate": 3.0293388648728908e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26575198769569397,
"step": 1730,
"valid_targets_mean": 5682.9,
"valid_targets_min": 3293
},
{
"epoch": 2.776,
"grad_norm": 0.4748210406966679,
"learning_rate": 3.022489018749508e-05,
"loss": 0.2786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28260117769241333,
"step": 1735,
"valid_targets_mean": 5148.7,
"valid_targets_min": 659
},
{
"epoch": 2.784,
"grad_norm": 0.4349828443150829,
"learning_rate": 3.015622895902068e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29926276206970215,
"step": 1740,
"valid_targets_mean": 5951.7,
"valid_targets_min": 532
},
{
"epoch": 2.792,
"grad_norm": 0.4101951619425804,
"learning_rate": 3.008740605630508e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27278026938438416,
"step": 1745,
"valid_targets_mean": 6255.8,
"valid_targets_min": 2383
},
{
"epoch": 2.8,
"grad_norm": 0.43886743945375883,
"learning_rate": 3.0018422574921337e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27373838424682617,
"step": 1750,
"valid_targets_mean": 6037.8,
"valid_targets_min": 2287
},
{
"epoch": 2.808,
"grad_norm": 0.46273862132614424,
"learning_rate": 2.9949279612998673e-05,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2563420534133911,
"step": 1755,
"valid_targets_mean": 5141.6,
"valid_targets_min": 2334
},
{
"epoch": 2.816,
"grad_norm": 0.42084337553867707,
"learning_rate": 2.9879978271205064e-05,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2631978392601013,
"step": 1760,
"valid_targets_mean": 5481.5,
"valid_targets_min": 2358
},
{
"epoch": 2.824,
"grad_norm": 0.4226323080765043,
"learning_rate": 2.9810519652729692e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27294427156448364,
"step": 1765,
"valid_targets_mean": 5862.9,
"valid_targets_min": 2158
},
{
"epoch": 2.832,
"grad_norm": 0.4133165678616725,
"learning_rate": 2.9740904863265378e-05,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25264087319374084,
"step": 1770,
"valid_targets_mean": 5787.2,
"valid_targets_min": 2246
},
{
"epoch": 2.84,
"grad_norm": 0.44849937220188063,
"learning_rate": 2.967113501099097e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32316309213638306,
"step": 1775,
"valid_targets_mean": 5906.6,
"valid_targets_min": 4056
},
{
"epoch": 2.848,
"grad_norm": 0.42817162546087406,
"learning_rate": 2.9601211206553745e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26556289196014404,
"step": 1780,
"valid_targets_mean": 5367.5,
"valid_targets_min": 845
},
{
"epoch": 2.856,
"grad_norm": 0.38768874404245973,
"learning_rate": 2.9531134563051686e-05,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2648174464702606,
"step": 1785,
"valid_targets_mean": 6421.1,
"valid_targets_min": 2438
},
{
"epoch": 2.864,
"grad_norm": 0.4047385059000395,
"learning_rate": 2.946090619601579e-05,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2702750265598297,
"step": 1790,
"valid_targets_mean": 6062.8,
"valid_targets_min": 2828
},
{
"epoch": 2.872,
"grad_norm": 0.4481184534104384,
"learning_rate": 2.9390527223392292e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30734002590179443,
"step": 1795,
"valid_targets_mean": 5348.5,
"valid_targets_min": 851
},
{
"epoch": 2.88,
"grad_norm": 0.4358783108651049,
"learning_rate": 2.931999876552488e-05,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29541853070259094,
"step": 1800,
"valid_targets_mean": 5955.2,
"valid_targets_min": 3117
},
{
"epoch": 2.888,
"grad_norm": 0.3874182891708397,
"learning_rate": 2.9249321945136854e-05,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2845751643180847,
"step": 1805,
"valid_targets_mean": 7245.1,
"valid_targets_min": 2606
},
{
"epoch": 2.896,
"grad_norm": 0.42410801990986086,
"learning_rate": 2.9178497887313257e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27056288719177246,
"step": 1810,
"valid_targets_mean": 5659.6,
"valid_targets_min": 1996
},
{
"epoch": 2.904,
"grad_norm": 0.46595265901950295,
"learning_rate": 2.9107527719482968e-05,
"loss": 0.2775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27986976504325867,
"step": 1815,
"valid_targets_mean": 5373.6,
"valid_targets_min": 1951
},
{
"epoch": 2.912,
"grad_norm": 0.4402020755344616,
"learning_rate": 2.9036412571400747e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2562943696975708,
"step": 1820,
"valid_targets_mean": 5127.8,
"valid_targets_min": 2872
},
{
"epoch": 2.92,
"grad_norm": 0.3805031455186279,
"learning_rate": 2.8965153575129255e-05,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894074320793152,
"step": 1825,
"valid_targets_mean": 7028.5,
"valid_targets_min": 3875
},
{
"epoch": 2.928,
"grad_norm": 0.4460246697987472,
"learning_rate": 2.8893751865021044e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25859567523002625,
"step": 1830,
"valid_targets_mean": 5250.1,
"valid_targets_min": 1151
},
{
"epoch": 2.936,
"grad_norm": 0.40198594148376793,
"learning_rate": 2.8822208577700473e-05,
"loss": 0.2815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24994345009326935,
"step": 1835,
"valid_targets_mean": 5900.0,
"valid_targets_min": 2878
},
{
"epoch": 2.944,
"grad_norm": 0.45652338078801363,
"learning_rate": 2.8750524852045642e-05,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3019225001335144,
"step": 1840,
"valid_targets_mean": 5770.6,
"valid_targets_min": 793
},
{
"epoch": 2.952,
"grad_norm": 0.3891949461136039,
"learning_rate": 2.867870182917024e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2574838697910309,
"step": 1845,
"valid_targets_mean": 5976.9,
"valid_targets_min": 2672
},
{
"epoch": 2.96,
"grad_norm": 0.4372813649278471,
"learning_rate": 2.8606740652405394e-05,
"loss": 0.289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29001131653785706,
"step": 1850,
"valid_targets_mean": 5360.3,
"valid_targets_min": 3093
},
{
"epoch": 2.968,
"grad_norm": 0.4165914393492165,
"learning_rate": 2.853464246728147e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2655784785747528,
"step": 1855,
"valid_targets_mean": 5410.2,
"valid_targets_min": 2130
},
{
"epoch": 2.976,
"grad_norm": 0.4008129134672245,
"learning_rate": 2.846240842150984e-05,
"loss": 0.2687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29392343759536743,
"step": 1860,
"valid_targets_mean": 6621.4,
"valid_targets_min": 2007
},
{
"epoch": 2.984,
"grad_norm": 0.4063502231247828,
"learning_rate": 2.839003966496458e-05,
"loss": 0.2795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2830163538455963,
"step": 1865,
"valid_targets_mean": 7332.2,
"valid_targets_min": 2647
},
{
"epoch": 2.992,
"grad_norm": 0.41454228214125255,
"learning_rate": 2.8317537349664215e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.300517737865448,
"step": 1870,
"valid_targets_mean": 6810.3,
"valid_targets_min": 1725
},
{
"epoch": 3.0,
"grad_norm": 0.3811043034757187,
"learning_rate": 2.824490262975334e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2567134201526642,
"step": 1875,
"valid_targets_mean": 6309.3,
"valid_targets_min": 2837
},
{
"epoch": 3.008,
"grad_norm": 0.44986998163213937,
"learning_rate": 2.817213666148427e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2562277913093567,
"step": 1880,
"valid_targets_mean": 4919.7,
"valid_targets_min": 2287
},
{
"epoch": 3.016,
"grad_norm": 0.39188395180907326,
"learning_rate": 2.809924060319862e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24832743406295776,
"step": 1885,
"valid_targets_mean": 5902.5,
"valid_targets_min": 2527
},
{
"epoch": 3.024,
"grad_norm": 0.44868780761237514,
"learning_rate": 2.802621561530888e-05,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2716829776763916,
"step": 1890,
"valid_targets_mean": 5865.4,
"valid_targets_min": 1532
},
{
"epoch": 3.032,
"grad_norm": 0.49232768631488905,
"learning_rate": 2.7953062860279937e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.254425048828125,
"step": 1895,
"valid_targets_mean": 4952.2,
"valid_targets_min": 2359
},
{
"epoch": 3.04,
"grad_norm": 0.39705870685465516,
"learning_rate": 2.7879783502610557e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26486480236053467,
"step": 1900,
"valid_targets_mean": 5991.8,
"valid_targets_min": 2506
},
{
"epoch": 3.048,
"grad_norm": 0.4103910836926923,
"learning_rate": 2.7806378708814875e-05,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2603754699230194,
"step": 1905,
"valid_targets_mean": 5866.4,
"valid_targets_min": 3445
},
{
"epoch": 3.056,
"grad_norm": 0.4404796718903863,
"learning_rate": 2.773284964740379e-05,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25497716665267944,
"step": 1910,
"valid_targets_mean": 5420.9,
"valid_targets_min": 2347
},
{
"epoch": 3.064,
"grad_norm": 0.4595279784055635,
"learning_rate": 2.7659197488866403e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2736179828643799,
"step": 1915,
"valid_targets_mean": 5122.2,
"valid_targets_min": 977
},
{
"epoch": 3.072,
"grad_norm": 0.47456111645753335,
"learning_rate": 2.7585423405651347e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2576856017112732,
"step": 1920,
"valid_targets_mean": 4942.1,
"valid_targets_min": 2950
},
{
"epoch": 3.08,
"grad_norm": 0.43777645624232037,
"learning_rate": 2.7511528572148153e-05,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27957212924957275,
"step": 1925,
"valid_targets_mean": 5275.7,
"valid_targets_min": 1870
},
{
"epoch": 3.088,
"grad_norm": 0.4522466576604798,
"learning_rate": 2.7437514164668536e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2531649172306061,
"step": 1930,
"valid_targets_mean": 4698.0,
"valid_targets_min": 1760
},
{
"epoch": 3.096,
"grad_norm": 0.4424402462760102,
"learning_rate": 2.7363381361427692e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2742995023727417,
"step": 1935,
"valid_targets_mean": 5695.1,
"valid_targets_min": 2581
},
{
"epoch": 3.104,
"grad_norm": 0.4157664621751824,
"learning_rate": 2.72891313425255e-05,
"loss": 0.2495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25712645053863525,
"step": 1940,
"valid_targets_mean": 5666.0,
"valid_targets_min": 2670
},
{
"epoch": 3.112,
"grad_norm": 0.4448020926912599,
"learning_rate": 2.7214765289927777e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2533559501171112,
"step": 1945,
"valid_targets_mean": 4905.4,
"valid_targets_min": 2204
},
{
"epoch": 3.12,
"grad_norm": 0.4416757344594968,
"learning_rate": 2.714028438744746e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23446297645568848,
"step": 1950,
"valid_targets_mean": 4820.4,
"valid_targets_min": 3010
},
{
"epoch": 3.128,
"grad_norm": 0.99132804143127,
"learning_rate": 2.706568982072573e-05,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25379735231399536,
"step": 1955,
"valid_targets_mean": 4584.4,
"valid_targets_min": 2042
},
{
"epoch": 3.136,
"grad_norm": 0.37723732371353097,
"learning_rate": 2.6990982777213174e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2723168730735779,
"step": 1960,
"valid_targets_mean": 6596.4,
"valid_targets_min": 840
},
{
"epoch": 3.144,
"grad_norm": 0.4271097743973345,
"learning_rate": 2.691616444615085e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26200491189956665,
"step": 1965,
"valid_targets_mean": 6096.9,
"valid_targets_min": 3143
},
{
"epoch": 3.152,
"grad_norm": 0.41531856969368103,
"learning_rate": 2.6841236018551402e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.260453999042511,
"step": 1970,
"valid_targets_mean": 5445.1,
"valid_targets_min": 563
},
{
"epoch": 3.16,
"grad_norm": 0.4417409056500301,
"learning_rate": 2.6766198687180028e-05,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2590559124946594,
"step": 1975,
"valid_targets_mean": 5636.7,
"valid_targets_min": 611
},
{
"epoch": 3.168,
"grad_norm": 0.4422829407193221,
"learning_rate": 2.6691053646535564e-05,
"loss": 0.2658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2656911313533783,
"step": 1980,
"valid_targets_mean": 5018.6,
"valid_targets_min": 619
},
{
"epoch": 3.176,
"grad_norm": 0.4237887881247236,
"learning_rate": 2.6615802092831446e-05,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2780739963054657,
"step": 1985,
"valid_targets_mean": 5302.7,
"valid_targets_min": 2266
},
{
"epoch": 3.184,
"grad_norm": 0.42380386232725864,
"learning_rate": 2.6540445223976637e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2620670199394226,
"step": 1990,
"valid_targets_mean": 6350.1,
"valid_targets_min": 776
},
{
"epoch": 3.192,
"grad_norm": 0.47180334207154845,
"learning_rate": 2.6464984239556602e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2522035539150238,
"step": 1995,
"valid_targets_mean": 5105.7,
"valid_targets_min": 707
},
{
"epoch": 3.2,
"grad_norm": 0.40590968448904624,
"learning_rate": 2.63894203408142e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2857327163219452,
"step": 2000,
"valid_targets_mean": 6472.3,
"valid_targets_min": 824
},
{
"epoch": 3.208,
"grad_norm": 0.4364196490684295,
"learning_rate": 2.6313754730630528e-05,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3018920421600342,
"step": 2005,
"valid_targets_mean": 6931.6,
"valid_targets_min": 3554
},
{
"epoch": 3.216,
"grad_norm": 0.4380123000076932,
"learning_rate": 2.623798861350582e-05,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27944761514663696,
"step": 2010,
"valid_targets_mean": 5875.2,
"valid_targets_min": 1748
},
{
"epoch": 3.224,
"grad_norm": 0.4370825009728502,
"learning_rate": 2.6162123195540247e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28861603140830994,
"step": 2015,
"valid_targets_mean": 5691.7,
"valid_targets_min": 2845
},
{
"epoch": 3.232,
"grad_norm": 0.485452151135628,
"learning_rate": 2.6086159684414726e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2795363664627075,
"step": 2020,
"valid_targets_mean": 4541.8,
"valid_targets_min": 797
},
{
"epoch": 3.24,
"grad_norm": 0.48611407649627225,
"learning_rate": 2.6010099289371694e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25999119877815247,
"step": 2025,
"valid_targets_mean": 4361.3,
"valid_targets_min": 809
},
{
"epoch": 3.248,
"grad_norm": 0.43314259033107916,
"learning_rate": 2.5933943221195844e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27597910165786743,
"step": 2030,
"valid_targets_mean": 5998.9,
"valid_targets_min": 3510
},
{
"epoch": 3.2560000000000002,
"grad_norm": 0.4467889320108032,
"learning_rate": 2.5857692692194884e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27943307161331177,
"step": 2035,
"valid_targets_mean": 6833.2,
"valid_targets_min": 3418
},
{
"epoch": 3.2640000000000002,
"grad_norm": 0.444733214195372,
"learning_rate": 2.5781348916180195e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2452739030122757,
"step": 2040,
"valid_targets_mean": 5335.4,
"valid_targets_min": 2970
},
{
"epoch": 3.2720000000000002,
"grad_norm": 0.4473237438727197,
"learning_rate": 2.570491310844755e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26792657375335693,
"step": 2045,
"valid_targets_mean": 5598.2,
"valid_targets_min": 3002
},
{
"epoch": 3.2800000000000002,
"grad_norm": 0.44916463593865047,
"learning_rate": 2.562838648575774e-05,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25192153453826904,
"step": 2050,
"valid_targets_mean": 5738.1,
"valid_targets_min": 1400
},
{
"epoch": 3.288,
"grad_norm": 0.37869541775803,
"learning_rate": 2.5551770266317224e-05,
"loss": 0.266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2549699544906616,
"step": 2055,
"valid_targets_mean": 6927.1,
"valid_targets_min": 3188
},
{
"epoch": 3.296,
"grad_norm": 0.45381896265008714,
"learning_rate": 2.5475065669758713e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2710186839103699,
"step": 2060,
"valid_targets_mean": 5502.5,
"valid_targets_min": 721
},
{
"epoch": 3.304,
"grad_norm": 0.476208174837823,
"learning_rate": 2.5398273917121786e-05,
"loss": 0.2658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2721608281135559,
"step": 2065,
"valid_targets_mean": 5169.7,
"valid_targets_min": 2469
},
{
"epoch": 3.312,
"grad_norm": 0.4512021420566415,
"learning_rate": 2.532139623083342e-05,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.280364990234375,
"step": 2070,
"valid_targets_mean": 5583.2,
"valid_targets_min": 759
},
{
"epoch": 3.32,
"grad_norm": 0.43311411478631495,
"learning_rate": 2.5244433834688552e-05,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24803069233894348,
"step": 2075,
"valid_targets_mean": 5230.8,
"valid_targets_min": 2395
},
{
"epoch": 3.328,
"grad_norm": 0.4236542010190115,
"learning_rate": 2.5167387953830602e-05,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26770997047424316,
"step": 2080,
"valid_targets_mean": 5747.2,
"valid_targets_min": 1906
},
{
"epoch": 3.336,
"grad_norm": 0.41233687112752104,
"learning_rate": 2.5090259814731946e-05,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23465529084205627,
"step": 2085,
"valid_targets_mean": 6191.6,
"valid_targets_min": 610
},
{
"epoch": 3.344,
"grad_norm": 0.4301152484815432,
"learning_rate": 2.5013050645174414e-05,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2639310359954834,
"step": 2090,
"valid_targets_mean": 5565.9,
"valid_targets_min": 970
},
{
"epoch": 3.352,
"grad_norm": 0.42805683293361596,
"learning_rate": 2.4935761674229735e-05,
"loss": 0.2741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28847432136535645,
"step": 2095,
"valid_targets_mean": 6180.6,
"valid_targets_min": 2325
},
{
"epoch": 3.36,
"grad_norm": 0.4108722186615793,
"learning_rate": 2.4858394132239982e-05,
"loss": 0.2631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26170119643211365,
"step": 2100,
"valid_targets_mean": 6346.6,
"valid_targets_min": 3315
},
{
"epoch": 3.368,
"grad_norm": 0.4438984053068301,
"learning_rate": 2.4780949250797964e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2657065987586975,
"step": 2105,
"valid_targets_mean": 5510.9,
"valid_targets_min": 2010
},
{
"epoch": 3.376,
"grad_norm": 0.40828469834181624,
"learning_rate": 2.4703428262727656e-05,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2982710003852844,
"step": 2110,
"valid_targets_mean": 6507.9,
"valid_targets_min": 2926
},
{
"epoch": 3.384,
"grad_norm": 0.43104351910647665,
"learning_rate": 2.4625832402064525e-05,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3116433024406433,
"step": 2115,
"valid_targets_mean": 5877.9,
"valid_targets_min": 636
},
{
"epoch": 3.392,
"grad_norm": 0.42418155412882275,
"learning_rate": 2.454816290403595e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2540300786495209,
"step": 2120,
"valid_targets_mean": 5527.6,
"valid_targets_min": 2077
},
{
"epoch": 3.4,
"grad_norm": 0.39935339866930863,
"learning_rate": 2.4470421005041492e-05,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25366467237472534,
"step": 2125,
"valid_targets_mean": 5777.4,
"valid_targets_min": 2126
},
{
"epoch": 3.408,
"grad_norm": 0.46642524230649085,
"learning_rate": 2.4392607942633263e-05,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2766075134277344,
"step": 2130,
"valid_targets_mean": 5309.3,
"valid_targets_min": 2492
},
{
"epoch": 3.416,
"grad_norm": 0.40542150642600944,
"learning_rate": 2.43147249554962e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2503218352794647,
"step": 2135,
"valid_targets_mean": 5945.4,
"valid_targets_min": 2787
},
{
"epoch": 3.424,
"grad_norm": 0.5003293603533124,
"learning_rate": 2.423677328342835e-05,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.269273042678833,
"step": 2140,
"valid_targets_mean": 4656.9,
"valid_targets_min": 2190
},
{
"epoch": 3.432,
"grad_norm": 0.43945562577333586,
"learning_rate": 2.415875416732113e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2691774368286133,
"step": 2145,
"valid_targets_mean": 5574.9,
"valid_targets_min": 2402
},
{
"epoch": 3.44,
"grad_norm": 0.46811613846101446,
"learning_rate": 2.4080668849139603e-05,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26551342010498047,
"step": 2150,
"valid_targets_mean": 5372.2,
"valid_targets_min": 991
},
{
"epoch": 3.448,
"grad_norm": 0.4077015317433029,
"learning_rate": 2.4002518571902665e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25210684537887573,
"step": 2155,
"valid_targets_mean": 5778.7,
"valid_targets_min": 2306
},
{
"epoch": 3.456,
"grad_norm": 0.440624451883909,
"learning_rate": 2.392430457966328e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24545451998710632,
"step": 2160,
"valid_targets_mean": 5699.8,
"valid_targets_min": 2457
},
{
"epoch": 3.464,
"grad_norm": 0.4644597860891612,
"learning_rate": 2.3846028117488686e-05,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2686898410320282,
"step": 2165,
"valid_targets_mean": 5256.7,
"valid_targets_min": 901
},
{
"epoch": 3.472,
"grad_norm": 0.45287734791016193,
"learning_rate": 2.3767690431440533e-05,
"loss": 0.2599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28908854722976685,
"step": 2170,
"valid_targets_mean": 6981.8,
"valid_targets_min": 708
},
{
"epoch": 3.48,
"grad_norm": 0.41268646628823424,
"learning_rate": 2.368929276855512e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26175349950790405,
"step": 2175,
"valid_targets_mean": 5828.8,
"valid_targets_min": 2328
},
{
"epoch": 3.488,
"grad_norm": 0.40243049575345696,
"learning_rate": 2.361083637682347e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26664072275161743,
"step": 2180,
"valid_targets_mean": 6444.5,
"valid_targets_min": 2079
},
{
"epoch": 3.496,
"grad_norm": 0.4208581290888113,
"learning_rate": 2.3532322505171502e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26101818680763245,
"step": 2185,
"valid_targets_mean": 5354.2,
"valid_targets_min": 2479
},
{
"epoch": 3.504,
"grad_norm": 0.3953533628663449,
"learning_rate": 2.3453752403440147e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26703381538391113,
"step": 2190,
"valid_targets_mean": 5831.3,
"valid_targets_min": 2203
},
{
"epoch": 3.512,
"grad_norm": 0.38434465715826854,
"learning_rate": 2.337512732236545e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23783396184444427,
"step": 2195,
"valid_targets_mean": 6418.1,
"valid_targets_min": 1104
},
{
"epoch": 3.52,
"grad_norm": 0.43338676646075414,
"learning_rate": 2.3296448513558628e-05,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26993754506111145,
"step": 2200,
"valid_targets_mean": 5462.9,
"valid_targets_min": 640
},
{
"epoch": 3.528,
"grad_norm": 0.4496777907267995,
"learning_rate": 2.321771722948622e-05,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2622802257537842,
"step": 2205,
"valid_targets_mean": 6097.9,
"valid_targets_min": 3581
},
{
"epoch": 3.536,
"grad_norm": 0.41566876544597353,
"learning_rate": 2.3138934723450074e-05,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2877008616924286,
"step": 2210,
"valid_targets_mean": 6912.1,
"valid_targets_min": 2531
},
{
"epoch": 3.544,
"grad_norm": 0.47881534922065505,
"learning_rate": 2.306010224956744e-05,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31302931904792786,
"step": 2215,
"valid_targets_mean": 5172.6,
"valid_targets_min": 970
},
{
"epoch": 3.552,
"grad_norm": 0.4090791008823442,
"learning_rate": 2.2981221062750986e-05,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23748889565467834,
"step": 2220,
"valid_targets_mean": 5436.2,
"valid_targets_min": 3544
},
{
"epoch": 3.56,
"grad_norm": 0.37997502199670286,
"learning_rate": 2.290229241868882e-05,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.251059353351593,
"step": 2225,
"valid_targets_mean": 5980.6,
"valid_targets_min": 687
},
{
"epoch": 3.568,
"grad_norm": 0.3986292880302235,
"learning_rate": 2.282331757382454e-05,
"loss": 0.2697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28471672534942627,
"step": 2230,
"valid_targets_mean": 6370.6,
"valid_targets_min": 1941
},
{
"epoch": 3.576,
"grad_norm": 0.431878132975706,
"learning_rate": 2.2744297785337155e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2553999125957489,
"step": 2235,
"valid_targets_mean": 5513.6,
"valid_targets_min": 2046
},
{
"epoch": 3.584,
"grad_norm": 0.4115529559985401,
"learning_rate": 2.2665234311121155e-05,
"loss": 0.2659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26266321539878845,
"step": 2240,
"valid_targets_mean": 5916.8,
"valid_targets_min": 2845
},
{
"epoch": 3.592,
"grad_norm": 0.45407655506541134,
"learning_rate": 2.258612840976645e-05,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24577778577804565,
"step": 2245,
"valid_targets_mean": 5146.2,
"valid_targets_min": 2756
},
{
"epoch": 3.6,
"grad_norm": 0.41467217796114125,
"learning_rate": 2.2506981340538315e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26159006357192993,
"step": 2250,
"valid_targets_mean": 5252.8,
"valid_targets_min": 537
},
{
"epoch": 3.608,
"grad_norm": 0.3919567632052263,
"learning_rate": 2.2427794363357384e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2614225745201111,
"step": 2255,
"valid_targets_mean": 6612.1,
"valid_targets_min": 2208
},
{
"epoch": 3.616,
"grad_norm": 0.43278714802298296,
"learning_rate": 2.2348568738779566e-05,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29214614629745483,
"step": 2260,
"valid_targets_mean": 6142.4,
"valid_targets_min": 1847
},
{
"epoch": 3.624,
"grad_norm": 0.4110332083414153,
"learning_rate": 2.2269305727975993e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29854828119277954,
"step": 2265,
"valid_targets_mean": 7177.7,
"valid_targets_min": 3515
},
{
"epoch": 3.632,
"grad_norm": 0.44547325805290383,
"learning_rate": 2.2190006592712927e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26258304715156555,
"step": 2270,
"valid_targets_mean": 5474.2,
"valid_targets_min": 2692
},
{
"epoch": 3.64,
"grad_norm": 0.4614610116421694,
"learning_rate": 2.2110672595331698e-05,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2816447913646698,
"step": 2275,
"valid_targets_mean": 4608.2,
"valid_targets_min": 384
},
{
"epoch": 3.648,
"grad_norm": 0.41303927586822076,
"learning_rate": 2.2031304998728587e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.261924684047699,
"step": 2280,
"valid_targets_mean": 5297.2,
"valid_targets_min": 664
},
{
"epoch": 3.656,
"grad_norm": 0.42755844253142716,
"learning_rate": 2.1951905066334737e-05,
"loss": 0.27,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.275720477104187,
"step": 2285,
"valid_targets_mean": 5888.2,
"valid_targets_min": 2348
},
{
"epoch": 3.664,
"grad_norm": 0.39946995165209875,
"learning_rate": 2.1872474062096046e-05,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27406832575798035,
"step": 2290,
"valid_targets_mean": 6055.6,
"valid_targets_min": 2541
},
{
"epoch": 3.672,
"grad_norm": 0.4286567596359356,
"learning_rate": 2.179301325045301e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26409912109375,
"step": 2295,
"valid_targets_mean": 5746.8,
"valid_targets_min": 1493
},
{
"epoch": 3.68,
"grad_norm": 0.6041261914809137,
"learning_rate": 2.1713523896320647e-05,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26296675205230713,
"step": 2300,
"valid_targets_mean": 5095.0,
"valid_targets_min": 798
},
{
"epoch": 3.6879999999999997,
"grad_norm": 0.4267338339744416,
"learning_rate": 2.163400726506832e-05,
"loss": 0.2595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24727872014045715,
"step": 2305,
"valid_targets_mean": 5302.2,
"valid_targets_min": 2620
},
{
"epoch": 3.6959999999999997,
"grad_norm": 0.41218171564224837,
"learning_rate": 2.155446462249961e-05,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26557302474975586,
"step": 2310,
"valid_targets_mean": 6288.5,
"valid_targets_min": 714
},
{
"epoch": 3.7039999999999997,
"grad_norm": 0.45281061679532264,
"learning_rate": 2.147489723483217e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2626858949661255,
"step": 2315,
"valid_targets_mean": 5368.7,
"valid_targets_min": 1957
},
{
"epoch": 3.7119999999999997,
"grad_norm": 0.48248707648966427,
"learning_rate": 2.139530636867757e-05,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2763807475566864,
"step": 2320,
"valid_targets_mean": 5099.9,
"valid_targets_min": 932
},
{
"epoch": 3.7199999999999998,
"grad_norm": 0.40742401489841945,
"learning_rate": 2.1315693291021114e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25393787026405334,
"step": 2325,
"valid_targets_mean": 5533.6,
"valid_targets_min": 2550
},
{
"epoch": 3.7279999999999998,
"grad_norm": 0.4100080302945935,
"learning_rate": 2.1236059269201686e-05,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2520829439163208,
"step": 2330,
"valid_targets_mean": 6048.5,
"valid_targets_min": 2362
},
{
"epoch": 3.7359999999999998,
"grad_norm": 0.45314645842815454,
"learning_rate": 2.1156405570891584e-05,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27272647619247437,
"step": 2335,
"valid_targets_mean": 5500.8,
"valid_targets_min": 613
},
{
"epoch": 3.7439999999999998,
"grad_norm": 0.4026491355138221,
"learning_rate": 2.1076733464076322e-05,
"loss": 0.2571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24665513634681702,
"step": 2340,
"valid_targets_mean": 5994.2,
"valid_targets_min": 960
},
{
"epoch": 3.752,
"grad_norm": 0.4702466547059018,
"learning_rate": 2.0997044217034462e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26227515935897827,
"step": 2345,
"valid_targets_mean": 5172.7,
"valid_targets_min": 2105
},
{
"epoch": 3.76,
"grad_norm": 0.4039545878119713,
"learning_rate": 2.0917339098317405e-05,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2739185094833374,
"step": 2350,
"valid_targets_mean": 6585.1,
"valid_targets_min": 2045
},
{
"epoch": 3.768,
"grad_norm": 0.4611875541775836,
"learning_rate": 2.083761937672922e-05,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2752639055252075,
"step": 2355,
"valid_targets_mean": 5468.2,
"valid_targets_min": 802
},
{
"epoch": 3.776,
"grad_norm": 0.47139731269484614,
"learning_rate": 2.0757886321306433e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2621690630912781,
"step": 2360,
"valid_targets_mean": 5031.0,
"valid_targets_min": 1183
},
{
"epoch": 3.784,
"grad_norm": 0.4249388855321063,
"learning_rate": 2.0678141201297827e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22892312705516815,
"step": 2365,
"valid_targets_mean": 5808.9,
"valid_targets_min": 2364
},
{
"epoch": 3.792,
"grad_norm": 0.4520229219931925,
"learning_rate": 2.059838528614423e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26507341861724854,
"step": 2370,
"valid_targets_mean": 5221.9,
"valid_targets_min": 2056
},
{
"epoch": 3.8,
"grad_norm": 0.4200067243880517,
"learning_rate": 2.0518619845458322e-05,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2991790771484375,
"step": 2375,
"valid_targets_mean": 6177.3,
"valid_targets_min": 2232
},
{
"epoch": 3.808,
"grad_norm": 0.38938230112936845,
"learning_rate": 2.0438846149004426e-05,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29206550121307373,
"step": 2380,
"valid_targets_mean": 6879.7,
"valid_targets_min": 3899
},
{
"epoch": 3.816,
"grad_norm": 0.45082171070921734,
"learning_rate": 2.0359065466678268e-05,
"loss": 0.2631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27746134996414185,
"step": 2385,
"valid_targets_mean": 5233.9,
"valid_targets_min": 1939
},
{
"epoch": 3.824,
"grad_norm": 0.45232849088890803,
"learning_rate": 2.0279279068486795e-05,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26361560821533203,
"step": 2390,
"valid_targets_mean": 5877.0,
"valid_targets_min": 2719
},
{
"epoch": 3.832,
"grad_norm": 0.459025083974539,
"learning_rate": 2.019948822452794e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2750234007835388,
"step": 2395,
"valid_targets_mean": 5298.2,
"valid_targets_min": 740
},
{
"epoch": 3.84,
"grad_norm": 0.4196361041060983,
"learning_rate": 2.0119694204970393e-05,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2892104387283325,
"step": 2400,
"valid_targets_mean": 6700.9,
"valid_targets_min": 2552
},
{
"epoch": 3.848,
"grad_norm": 0.4133422781214903,
"learning_rate": 2.0039898280033414e-05,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2697451412677765,
"step": 2405,
"valid_targets_mean": 5783.1,
"valid_targets_min": 1798
},
{
"epoch": 3.856,
"grad_norm": 0.42185605892875344,
"learning_rate": 1.9960101719966592e-05,
"loss": 0.2775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2788695693016052,
"step": 2410,
"valid_targets_mean": 5466.9,
"valid_targets_min": 2780
},
{
"epoch": 3.864,
"grad_norm": 0.4065091466238856,
"learning_rate": 1.9880305795029617e-05,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26106393337249756,
"step": 2415,
"valid_targets_mean": 5957.0,
"valid_targets_min": 2787
},
{
"epoch": 3.872,
"grad_norm": 0.4350518885133558,
"learning_rate": 1.980051177547207e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2566600441932678,
"step": 2420,
"valid_targets_mean": 5157.2,
"valid_targets_min": 2272
},
{
"epoch": 3.88,
"grad_norm": 0.43647694712355944,
"learning_rate": 1.9720720931513212e-05,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27034640312194824,
"step": 2425,
"valid_targets_mean": 5680.7,
"valid_targets_min": 2868
},
{
"epoch": 3.888,
"grad_norm": 0.4465441645571561,
"learning_rate": 1.9640934533321735e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2533532977104187,
"step": 2430,
"valid_targets_mean": 4983.7,
"valid_targets_min": 1607
},
{
"epoch": 3.896,
"grad_norm": 0.4948292300701761,
"learning_rate": 1.9561153850995577e-05,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2283918261528015,
"step": 2435,
"valid_targets_mean": 4227.5,
"valid_targets_min": 2344
},
{
"epoch": 3.904,
"grad_norm": 0.4484712258176857,
"learning_rate": 1.948138015454168e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28464293479919434,
"step": 2440,
"valid_targets_mean": 5670.1,
"valid_targets_min": 2449
},
{
"epoch": 3.912,
"grad_norm": 0.43934564876974813,
"learning_rate": 1.9401614713855775e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26345354318618774,
"step": 2445,
"valid_targets_mean": 5403.1,
"valid_targets_min": 707
},
{
"epoch": 3.92,
"grad_norm": 0.416395054814685,
"learning_rate": 1.932185879870218e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25871995091438293,
"step": 2450,
"valid_targets_mean": 5303.6,
"valid_targets_min": 2395
},
{
"epoch": 3.928,
"grad_norm": 0.43694368425623087,
"learning_rate": 1.924211367869357e-05,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24475713074207306,
"step": 2455,
"valid_targets_mean": 5055.1,
"valid_targets_min": 2806
},
{
"epoch": 3.936,
"grad_norm": 0.4243501892440525,
"learning_rate": 1.9162380623270783e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22306443750858307,
"step": 2460,
"valid_targets_mean": 5135.1,
"valid_targets_min": 2248
},
{
"epoch": 3.944,
"grad_norm": 0.44283286109138925,
"learning_rate": 1.90826609016826e-05,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2637837529182434,
"step": 2465,
"valid_targets_mean": 5476.3,
"valid_targets_min": 759
},
{
"epoch": 3.952,
"grad_norm": 0.42470717124634133,
"learning_rate": 1.9002955782965548e-05,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27605631947517395,
"step": 2470,
"valid_targets_mean": 5417.3,
"valid_targets_min": 2605
},
{
"epoch": 3.96,
"grad_norm": 0.3803343612948792,
"learning_rate": 1.8923266535923688e-05,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2890893220901489,
"step": 2475,
"valid_targets_mean": 7136.2,
"valid_targets_min": 3811
},
{
"epoch": 3.968,
"grad_norm": 0.4130261601006259,
"learning_rate": 1.8843594429108426e-05,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2711412012577057,
"step": 2480,
"valid_targets_mean": 6824.2,
"valid_targets_min": 2246
},
{
"epoch": 3.976,
"grad_norm": 0.4468048565381207,
"learning_rate": 1.8763940730798324e-05,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2685108482837677,
"step": 2485,
"valid_targets_mean": 4759.8,
"valid_targets_min": 763
},
{
"epoch": 3.984,
"grad_norm": 0.45251787058208964,
"learning_rate": 1.8684306708978896e-05,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2934056222438812,
"step": 2490,
"valid_targets_mean": 4659.1,
"valid_targets_min": 920
},
{
"epoch": 3.992,
"grad_norm": 0.43509351569725757,
"learning_rate": 1.8604693631322433e-05,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24598343670368195,
"step": 2495,
"valid_targets_mean": 4712.8,
"valid_targets_min": 607
},
{
"epoch": 4.0,
"grad_norm": 0.4139875035737289,
"learning_rate": 1.852510276516783e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22778859734535217,
"step": 2500,
"valid_targets_mean": 5029.6,
"valid_targets_min": 2780
},
{
"epoch": 4.008,
"grad_norm": 0.4026517254214821,
"learning_rate": 1.8445535377500393e-05,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2527252435684204,
"step": 2505,
"valid_targets_mean": 5420.4,
"valid_targets_min": 804
},
{
"epoch": 4.016,
"grad_norm": 0.527046696353138,
"learning_rate": 1.8365992734931686e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23123949766159058,
"step": 2510,
"valid_targets_mean": 4485.6,
"valid_targets_min": 932
},
{
"epoch": 4.024,
"grad_norm": 0.4502829884248935,
"learning_rate": 1.8286476103679356e-05,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25222235918045044,
"step": 2515,
"valid_targets_mean": 5331.8,
"valid_targets_min": 2508
},
{
"epoch": 4.032,
"grad_norm": 0.40196394658018636,
"learning_rate": 1.8206986749546992e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2326112687587738,
"step": 2520,
"valid_targets_mean": 5491.2,
"valid_targets_min": 2650
},
{
"epoch": 4.04,
"grad_norm": 0.4419760841326031,
"learning_rate": 1.8127525937903957e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25284963846206665,
"step": 2525,
"valid_targets_mean": 5374.3,
"valid_targets_min": 724
},
{
"epoch": 4.048,
"grad_norm": 0.563487988263502,
"learning_rate": 1.8048094933665262e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23597420752048492,
"step": 2530,
"valid_targets_mean": 4752.8,
"valid_targets_min": 2266
},
{
"epoch": 4.056,
"grad_norm": 0.4207542474689084,
"learning_rate": 1.7968695001271416e-05,
"loss": 0.2571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25209924578666687,
"step": 2535,
"valid_targets_mean": 5711.2,
"valid_targets_min": 2319
},
{
"epoch": 4.064,
"grad_norm": 0.4164797883736113,
"learning_rate": 1.7889327404668316e-05,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26291561126708984,
"step": 2540,
"valid_targets_mean": 5958.5,
"valid_targets_min": 3351
},
{
"epoch": 4.072,
"grad_norm": 0.4280721543502966,
"learning_rate": 1.7809993407287083e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2563862204551697,
"step": 2545,
"valid_targets_mean": 5596.1,
"valid_targets_min": 2016
},
{
"epoch": 4.08,
"grad_norm": 0.41964916244227835,
"learning_rate": 1.7730694272024018e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2623998522758484,
"step": 2550,
"valid_targets_mean": 5987.8,
"valid_targets_min": 711
},
{
"epoch": 4.088,
"grad_norm": 0.4050228919933895,
"learning_rate": 1.765143126122044e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23614199459552765,
"step": 2555,
"valid_targets_mean": 5699.4,
"valid_targets_min": 2592
},
{
"epoch": 4.096,
"grad_norm": 0.3910248661150996,
"learning_rate": 1.7572205636642622e-05,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25823622941970825,
"step": 2560,
"valid_targets_mean": 7367.4,
"valid_targets_min": 3276
},
{
"epoch": 4.104,
"grad_norm": 0.42236355425116934,
"learning_rate": 1.749301865946169e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2622085511684418,
"step": 2565,
"valid_targets_mean": 5688.9,
"valid_targets_min": 2657
},
{
"epoch": 4.112,
"grad_norm": 0.42509311490729107,
"learning_rate": 1.7413871590233557e-05,
"loss": 0.2616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2588081359863281,
"step": 2570,
"valid_targets_mean": 6006.1,
"valid_targets_min": 1061
},
{
"epoch": 4.12,
"grad_norm": 0.4057780074446429,
"learning_rate": 1.7334765688878848e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23342590034008026,
"step": 2575,
"valid_targets_mean": 5994.2,
"valid_targets_min": 3506
},
{
"epoch": 4.128,
"grad_norm": 0.4581070105994256,
"learning_rate": 1.7255702214662852e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26349925994873047,
"step": 2580,
"valid_targets_mean": 5232.7,
"valid_targets_min": 549
},
{
"epoch": 4.136,
"grad_norm": 0.4166464687342281,
"learning_rate": 1.7176682426175468e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.251516729593277,
"step": 2585,
"valid_targets_mean": 5601.5,
"valid_targets_min": 2340
},
{
"epoch": 4.144,
"grad_norm": 0.4657055090249881,
"learning_rate": 1.709770758131118e-05,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23418261110782623,
"step": 2590,
"valid_targets_mean": 4537.5,
"valid_targets_min": 2258
},
{
"epoch": 4.152,
"grad_norm": 0.4116673541052104,
"learning_rate": 1.7018778937249017e-05,
"loss": 0.2559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24612781405448914,
"step": 2595,
"valid_targets_mean": 6193.2,
"valid_targets_min": 2229
},
{
"epoch": 4.16,
"grad_norm": 0.4340572439834897,
"learning_rate": 1.6939897750432562e-05,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2452816367149353,
"step": 2600,
"valid_targets_mean": 5402.6,
"valid_targets_min": 1660
},
{
"epoch": 4.168,
"grad_norm": 0.43025994341938056,
"learning_rate": 1.6861065276549933e-05,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2600667476654053,
"step": 2605,
"valid_targets_mean": 5861.5,
"valid_targets_min": 2402
},
{
"epoch": 4.176,
"grad_norm": 0.42608335179914697,
"learning_rate": 1.6782282770513788e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23782122135162354,
"step": 2610,
"valid_targets_mean": 5192.6,
"valid_targets_min": 2508
},
{
"epoch": 4.184,
"grad_norm": 0.4277951887838342,
"learning_rate": 1.6703551486441382e-05,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25356531143188477,
"step": 2615,
"valid_targets_mean": 5669.9,
"valid_targets_min": 1543
},
{
"epoch": 4.192,
"grad_norm": 0.4609230061476829,
"learning_rate": 1.6624872677634565e-05,
"loss": 0.25,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24406729638576508,
"step": 2620,
"valid_targets_mean": 4672.6,
"valid_targets_min": 2794
},
{
"epoch": 4.2,
"grad_norm": 0.40355339238632393,
"learning_rate": 1.654624759655986e-05,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29306623339653015,
"step": 2625,
"valid_targets_mean": 6442.0,
"valid_targets_min": 2237
},
{
"epoch": 4.208,
"grad_norm": 0.425607995518686,
"learning_rate": 1.64676774948285e-05,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23136329650878906,
"step": 2630,
"valid_targets_mean": 5687.0,
"valid_targets_min": 2907
},
{
"epoch": 4.216,
"grad_norm": 0.42610729575271533,
"learning_rate": 1.6389163623176536e-05,
"loss": 0.2576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25710445642471313,
"step": 2635,
"valid_targets_mean": 5690.4,
"valid_targets_min": 2275
},
{
"epoch": 4.224,
"grad_norm": 0.4502455592506156,
"learning_rate": 1.6310707231444884e-05,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25009778141975403,
"step": 2640,
"valid_targets_mean": 5083.6,
"valid_targets_min": 2693
},
{
"epoch": 4.232,
"grad_norm": 0.42929174971662437,
"learning_rate": 1.623230956855947e-05,
"loss": 0.2393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24527814984321594,
"step": 2645,
"valid_targets_mean": 5330.5,
"valid_targets_min": 2359
},
{
"epoch": 4.24,
"grad_norm": 0.38173395631546464,
"learning_rate": 1.6153971882511324e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2393120527267456,
"step": 2650,
"valid_targets_mean": 6225.8,
"valid_targets_min": 3329
},
{
"epoch": 4.248,
"grad_norm": 0.3933433949338803,
"learning_rate": 1.6075695420336724e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2711977958679199,
"step": 2655,
"valid_targets_mean": 6330.6,
"valid_targets_min": 2363
},
{
"epoch": 4.256,
"grad_norm": 0.4121284121686269,
"learning_rate": 1.5997481428097338e-05,
"loss": 0.2453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24723577499389648,
"step": 2660,
"valid_targets_mean": 5960.3,
"valid_targets_min": 3191
},
{
"epoch": 4.264,
"grad_norm": 0.3882119749671396,
"learning_rate": 1.5919331150860396e-05,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2718477249145508,
"step": 2665,
"valid_targets_mean": 6472.1,
"valid_targets_min": 3292
},
{
"epoch": 4.272,
"grad_norm": 0.4100674855225304,
"learning_rate": 1.5841245832678873e-05,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23369711637496948,
"step": 2670,
"valid_targets_mean": 5683.4,
"valid_targets_min": 763
},
{
"epoch": 4.28,
"grad_norm": 0.41838795378288424,
"learning_rate": 1.576322671657166e-05,
"loss": 0.2576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2701454758644104,
"step": 2675,
"valid_targets_mean": 6447.2,
"valid_targets_min": 2868
},
{
"epoch": 4.288,
"grad_norm": 0.4400893801670801,
"learning_rate": 1.5685275044503804e-05,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24263077974319458,
"step": 2680,
"valid_targets_mean": 5147.9,
"valid_targets_min": 2684
},
{
"epoch": 4.296,
"grad_norm": 0.46173199977270163,
"learning_rate": 1.560739205736674e-05,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26507413387298584,
"step": 2685,
"valid_targets_mean": 5198.1,
"valid_targets_min": 613
},
{
"epoch": 4.304,
"grad_norm": 0.45496647831386733,
"learning_rate": 1.552957899495851e-05,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2521948218345642,
"step": 2690,
"valid_targets_mean": 4976.4,
"valid_targets_min": 1184
},
{
"epoch": 4.312,
"grad_norm": 0.4633484681626059,
"learning_rate": 1.5451837095964054e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26329267024993896,
"step": 2695,
"valid_targets_mean": 5536.6,
"valid_targets_min": 802
},
{
"epoch": 4.32,
"grad_norm": 0.3777915678980122,
"learning_rate": 1.5374167597935478e-05,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2505547106266022,
"step": 2700,
"valid_targets_mean": 7020.2,
"valid_targets_min": 3721
},
{
"epoch": 4.328,
"grad_norm": 0.432513339772364,
"learning_rate": 1.5296571737272354e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26320308446884155,
"step": 2705,
"valid_targets_mean": 5831.6,
"valid_targets_min": 2076
},
{
"epoch": 4.336,
"grad_norm": 0.4259936130726487,
"learning_rate": 1.5219050749202037e-05,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26931965351104736,
"step": 2710,
"valid_targets_mean": 5925.8,
"valid_targets_min": 3057
},
{
"epoch": 4.344,
"grad_norm": 0.43484781101199177,
"learning_rate": 1.5141605867760021e-05,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2746845483779907,
"step": 2715,
"valid_targets_mean": 5499.1,
"valid_targets_min": 879
},
{
"epoch": 4.352,
"grad_norm": 0.4240116184683575,
"learning_rate": 1.5064238325770267e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27649781107902527,
"step": 2720,
"valid_targets_mean": 6327.1,
"valid_targets_min": 3023
},
{
"epoch": 4.36,
"grad_norm": 0.46160595397956594,
"learning_rate": 1.498694935482559e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23835043609142303,
"step": 2725,
"valid_targets_mean": 4995.6,
"valid_targets_min": 384
},
{
"epoch": 4.368,
"grad_norm": 0.42449896176713736,
"learning_rate": 1.4909740185268056e-05,
"loss": 0.2693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3132569193840027,
"step": 2730,
"valid_targets_mean": 7493.7,
"valid_targets_min": 2898
},
{
"epoch": 4.376,
"grad_norm": 0.4634859796301222,
"learning_rate": 1.4832612046169408e-05,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26285839080810547,
"step": 2735,
"valid_targets_mean": 4890.0,
"valid_targets_min": 920
},
{
"epoch": 4.384,
"grad_norm": 0.5118855317119525,
"learning_rate": 1.4755566165311455e-05,
"loss": 0.2453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2320340871810913,
"step": 2740,
"valid_targets_mean": 4532.7,
"valid_targets_min": 834
},
{
"epoch": 4.392,
"grad_norm": 0.3720350693877654,
"learning_rate": 1.4678603769166591e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26782023906707764,
"step": 2745,
"valid_targets_mean": 7465.8,
"valid_targets_min": 2616
},
{
"epoch": 4.4,
"grad_norm": 0.38971835604206173,
"learning_rate": 1.4601726082878226e-05,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2792567014694214,
"step": 2750,
"valid_targets_mean": 6849.9,
"valid_targets_min": 2097
},
{
"epoch": 4.408,
"grad_norm": 0.40344159503778143,
"learning_rate": 1.4524934330241292e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2851219177246094,
"step": 2755,
"valid_targets_mean": 6309.6,
"valid_targets_min": 2719
},
{
"epoch": 4.416,
"grad_norm": 0.3938933697532101,
"learning_rate": 1.4448229733682784e-05,
"loss": 0.257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23094943165779114,
"step": 2760,
"valid_targets_mean": 5509.4,
"valid_targets_min": 499
},
{
"epoch": 4.424,
"grad_norm": 0.41239113282985423,
"learning_rate": 1.4371613514242264e-05,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2564051151275635,
"step": 2765,
"valid_targets_mean": 6004.9,
"valid_targets_min": 664
},
{
"epoch": 4.432,
"grad_norm": 0.3935389062042307,
"learning_rate": 1.4295086891552457e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2657475769519806,
"step": 2770,
"valid_targets_mean": 6504.3,
"valid_targets_min": 3996
},
{
"epoch": 4.44,
"grad_norm": 0.445989307618548,
"learning_rate": 1.4218651083819811e-05,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23502030968666077,
"step": 2775,
"valid_targets_mean": 5178.3,
"valid_targets_min": 2092
},
{
"epoch": 4.448,
"grad_norm": 0.4197509448438314,
"learning_rate": 1.4142307307805125e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24606627225875854,
"step": 2780,
"valid_targets_mean": 5779.6,
"valid_targets_min": 2508
},
{
"epoch": 4.456,
"grad_norm": 0.4511017310825799,
"learning_rate": 1.406605677880416e-05,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24840837717056274,
"step": 2785,
"valid_targets_mean": 5349.4,
"valid_targets_min": 2473
},
{
"epoch": 4.464,
"grad_norm": 0.45567039640007745,
"learning_rate": 1.3989900710628313e-05,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2618921995162964,
"step": 2790,
"valid_targets_mean": 5036.2,
"valid_targets_min": 542
},
{
"epoch": 4.4719999999999995,
"grad_norm": 0.43962860716408275,
"learning_rate": 1.3913840315585279e-05,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27140137553215027,
"step": 2795,
"valid_targets_mean": 5845.9,
"valid_targets_min": 2457
},
{
"epoch": 4.48,
"grad_norm": 0.43611294833451114,
"learning_rate": 1.3837876804459765e-05,
"loss": 0.2486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25768083333969116,
"step": 2800,
"valid_targets_mean": 5575.6,
"valid_targets_min": 746
},
{
"epoch": 4.4879999999999995,
"grad_norm": 0.42803383496080244,
"learning_rate": 1.3762011386494191e-05,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2686399519443512,
"step": 2805,
"valid_targets_mean": 5792.1,
"valid_targets_min": 921
},
{
"epoch": 4.496,
"grad_norm": 0.4719245633331461,
"learning_rate": 1.3686245269369485e-05,
"loss": 0.2663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30958646535873413,
"step": 2810,
"valid_targets_mean": 6427.6,
"valid_targets_min": 1017
},
{
"epoch": 4.504,
"grad_norm": 0.4237505355734542,
"learning_rate": 1.3610579659185809e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26016536355018616,
"step": 2815,
"valid_targets_mean": 5658.1,
"valid_targets_min": 720
},
{
"epoch": 4.5120000000000005,
"grad_norm": 0.38024984937490686,
"learning_rate": 1.35350157604434e-05,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2725783586502075,
"step": 2820,
"valid_targets_mean": 6973.2,
"valid_targets_min": 2168
},
{
"epoch": 4.52,
"grad_norm": 0.41952130341304616,
"learning_rate": 1.345955477602337e-05,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26130425930023193,
"step": 2825,
"valid_targets_mean": 6372.4,
"valid_targets_min": 1173
},
{
"epoch": 4.5280000000000005,
"grad_norm": 0.4528337053842432,
"learning_rate": 1.3384197907168561e-05,
"loss": 0.2473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25075584650039673,
"step": 2830,
"valid_targets_mean": 5724.8,
"valid_targets_min": 2776
},
{
"epoch": 4.536,
"grad_norm": 0.41288983796665957,
"learning_rate": 1.3308946353464438e-05,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24849629402160645,
"step": 2835,
"valid_targets_mean": 5834.9,
"valid_targets_min": 2456
},
{
"epoch": 4.5440000000000005,
"grad_norm": 0.4109103515660612,
"learning_rate": 1.3233801312819979e-05,
"loss": 0.2506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24398134648799896,
"step": 2840,
"valid_targets_mean": 5745.9,
"valid_targets_min": 3589
},
{
"epoch": 4.552,
"grad_norm": 0.41889125877984157,
"learning_rate": 1.3158763981448606e-05,
"loss": 0.2537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2618812620639801,
"step": 2845,
"valid_targets_mean": 6272.4,
"valid_targets_min": 1666
},
{
"epoch": 4.5600000000000005,
"grad_norm": 0.4550626345785704,
"learning_rate": 1.3083835553849148e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2640746831893921,
"step": 2850,
"valid_targets_mean": 5556.9,
"valid_targets_min": 1918
},
{
"epoch": 4.568,
"grad_norm": 0.4316185089835862,
"learning_rate": 1.3009017222786828e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2707984745502472,
"step": 2855,
"valid_targets_mean": 5878.1,
"valid_targets_min": 2964
},
{
"epoch": 4.576,
"grad_norm": 0.3506904633597355,
"learning_rate": 1.2934310179274269e-05,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24263477325439453,
"step": 2860,
"valid_targets_mean": 7210.3,
"valid_targets_min": 2190
},
{
"epoch": 4.584,
"grad_norm": 0.3830616811150377,
"learning_rate": 1.2859715612552541e-05,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22636298835277557,
"step": 2865,
"valid_targets_mean": 6734.7,
"valid_targets_min": 2555
},
{
"epoch": 4.592,
"grad_norm": 0.4555586317701132,
"learning_rate": 1.278523471007223e-05,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2616588771343231,
"step": 2870,
"valid_targets_mean": 5836.5,
"valid_targets_min": 3143
},
{
"epoch": 4.6,
"grad_norm": 0.45645747710035556,
"learning_rate": 1.271086865747451e-05,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24527783691883087,
"step": 2875,
"valid_targets_mean": 5121.6,
"valid_targets_min": 2841
},
{
"epoch": 4.608,
"grad_norm": 0.466642440212726,
"learning_rate": 1.2636618638572316e-05,
"loss": 0.2537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2527911067008972,
"step": 2880,
"valid_targets_mean": 5101.9,
"valid_targets_min": 997
},
{
"epoch": 4.616,
"grad_norm": 0.46937573930033066,
"learning_rate": 1.2562485835331466e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2864949405193329,
"step": 2885,
"valid_targets_mean": 5126.4,
"valid_targets_min": 442
},
{
"epoch": 4.624,
"grad_norm": 0.46822865956269294,
"learning_rate": 1.2488471427851852e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28379178047180176,
"step": 2890,
"valid_targets_mean": 6053.8,
"valid_targets_min": 970
},
{
"epoch": 4.632,
"grad_norm": 0.45941682547920754,
"learning_rate": 1.241457659434866e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27936357259750366,
"step": 2895,
"valid_targets_mean": 5776.1,
"valid_targets_min": 3188
},
{
"epoch": 4.64,
"grad_norm": 0.4385032906332573,
"learning_rate": 1.2340802511133605e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2690129578113556,
"step": 2900,
"valid_targets_mean": 5771.6,
"valid_targets_min": 1872
},
{
"epoch": 4.648,
"grad_norm": 0.3719833844478648,
"learning_rate": 1.2267150352596216e-05,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24423128366470337,
"step": 2905,
"valid_targets_mean": 6587.7,
"valid_targets_min": 2041
},
{
"epoch": 4.656,
"grad_norm": 0.49249405276783137,
"learning_rate": 1.2193621291185132e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2529935836791992,
"step": 2910,
"valid_targets_mean": 5225.8,
"valid_targets_min": 1416
},
{
"epoch": 4.664,
"grad_norm": 0.41781331593173815,
"learning_rate": 1.2120216497389446e-05,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2483152151107788,
"step": 2915,
"valid_targets_mean": 5744.6,
"valid_targets_min": 2086
},
{
"epoch": 4.672,
"grad_norm": 0.4047966801272431,
"learning_rate": 1.2046937139720068e-05,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2477341890335083,
"step": 2920,
"valid_targets_mean": 5689.0,
"valid_targets_min": 759
},
{
"epoch": 4.68,
"grad_norm": 0.37498929916376766,
"learning_rate": 1.1973784384691121e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2430843859910965,
"step": 2925,
"valid_targets_mean": 7156.9,
"valid_targets_min": 2993
},
{
"epoch": 4.688,
"grad_norm": 0.41388324850358565,
"learning_rate": 1.1900759396801382e-05,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2551068067550659,
"step": 2930,
"valid_targets_mean": 6077.2,
"valid_targets_min": 3013
},
{
"epoch": 4.696,
"grad_norm": 0.36861725664383904,
"learning_rate": 1.1827863338515741e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2571861445903778,
"step": 2935,
"valid_targets_mean": 6625.1,
"valid_targets_min": 824
},
{
"epoch": 4.704,
"grad_norm": 0.48378743134760654,
"learning_rate": 1.1755097370246669e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2558562457561493,
"step": 2940,
"valid_targets_mean": 5220.9,
"valid_targets_min": 2269
},
{
"epoch": 4.712,
"grad_norm": 0.4406782311453092,
"learning_rate": 1.1682462650335791e-05,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25980138778686523,
"step": 2945,
"valid_targets_mean": 5291.1,
"valid_targets_min": 2112
},
{
"epoch": 4.72,
"grad_norm": 0.4219789914017073,
"learning_rate": 1.1609960335035423e-05,
"loss": 0.2576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28451454639434814,
"step": 2950,
"valid_targets_mean": 6052.9,
"valid_targets_min": 2838
},
{
"epoch": 4.728,
"grad_norm": 0.4542496598947857,
"learning_rate": 1.1537591578490165e-05,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24413950741291046,
"step": 2955,
"valid_targets_mean": 4976.8,
"valid_targets_min": 735
},
{
"epoch": 4.736,
"grad_norm": 0.43241503805052256,
"learning_rate": 1.146535753271853e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23115313053131104,
"step": 2960,
"valid_targets_mean": 4997.9,
"valid_targets_min": 2360
},
{
"epoch": 4.744,
"grad_norm": 0.44686143386709815,
"learning_rate": 1.139325934759461e-05,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26531267166137695,
"step": 2965,
"valid_targets_mean": 5456.7,
"valid_targets_min": 760
},
{
"epoch": 4.752,
"grad_norm": 0.4012430319952668,
"learning_rate": 1.1321298170829768e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2565727233886719,
"step": 2970,
"valid_targets_mean": 6016.4,
"valid_targets_min": 786
},
{
"epoch": 4.76,
"grad_norm": 0.40873161812607367,
"learning_rate": 1.1249475147954363e-05,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28063255548477173,
"step": 2975,
"valid_targets_mean": 6314.0,
"valid_targets_min": 2924
},
{
"epoch": 4.768,
"grad_norm": 0.3764269524348353,
"learning_rate": 1.1177791422299528e-05,
"loss": 0.2479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2501315474510193,
"step": 2980,
"valid_targets_mean": 6623.1,
"valid_targets_min": 4202
},
{
"epoch": 4.776,
"grad_norm": 0.4295656083509184,
"learning_rate": 1.1106248134978959e-05,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2510390281677246,
"step": 2985,
"valid_targets_mean": 5810.9,
"valid_targets_min": 2502
},
{
"epoch": 4.784,
"grad_norm": 0.4286687447325965,
"learning_rate": 1.1034846424870744e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2772992253303528,
"step": 2990,
"valid_targets_mean": 5971.2,
"valid_targets_min": 2590
},
{
"epoch": 4.792,
"grad_norm": 0.374726299286535,
"learning_rate": 1.0963587428599256e-05,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24093443155288696,
"step": 2995,
"valid_targets_mean": 6393.6,
"valid_targets_min": 2733
},
{
"epoch": 4.8,
"grad_norm": 0.39305947450528317,
"learning_rate": 1.089247228051704e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26492711901664734,
"step": 3000,
"valid_targets_mean": 6464.1,
"valid_targets_min": 902
},
{
"epoch": 4.808,
"grad_norm": 0.43173986170046935,
"learning_rate": 1.0821502112686753e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26849010586738586,
"step": 3005,
"valid_targets_mean": 6025.8,
"valid_targets_min": 876
},
{
"epoch": 4.816,
"grad_norm": 0.553114591599834,
"learning_rate": 1.0750678054863158e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25507980585098267,
"step": 3010,
"valid_targets_mean": 5294.4,
"valid_targets_min": 2993
},
{
"epoch": 4.824,
"grad_norm": 0.4183913969010833,
"learning_rate": 1.0680001234475127e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23742127418518066,
"step": 3015,
"valid_targets_mean": 5359.8,
"valid_targets_min": 2555
},
{
"epoch": 4.832,
"grad_norm": 0.41631043723949235,
"learning_rate": 1.0609472776607715e-05,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26865795254707336,
"step": 3020,
"valid_targets_mean": 6159.6,
"valid_targets_min": 2405
},
{
"epoch": 4.84,
"grad_norm": 0.4078093943828265,
"learning_rate": 1.0539093803984217e-05,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24415555596351624,
"step": 3025,
"valid_targets_mean": 5986.4,
"valid_targets_min": 2063
},
{
"epoch": 4.848,
"grad_norm": 0.40603508493805524,
"learning_rate": 1.046886543694832e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2623901069164276,
"step": 3030,
"valid_targets_mean": 6127.6,
"valid_targets_min": 2081
},
{
"epoch": 4.856,
"grad_norm": 0.49406303870996265,
"learning_rate": 1.0398788793446263e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2604304552078247,
"step": 3035,
"valid_targets_mean": 4751.2,
"valid_targets_min": 779
},
{
"epoch": 4.864,
"grad_norm": 0.44990796885772155,
"learning_rate": 1.0328864989009037e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26390713453292847,
"step": 3040,
"valid_targets_mean": 5145.4,
"valid_targets_min": 2084
},
{
"epoch": 4.872,
"grad_norm": 0.42810640807420824,
"learning_rate": 1.0259095136734634e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.291616827249527,
"step": 3045,
"valid_targets_mean": 6583.1,
"valid_targets_min": 1114
},
{
"epoch": 4.88,
"grad_norm": 0.4597136382960901,
"learning_rate": 1.0189480347270311e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22865967452526093,
"step": 3050,
"valid_targets_mean": 4451.9,
"valid_targets_min": 610
},
{
"epoch": 4.888,
"grad_norm": 0.4458559434583576,
"learning_rate": 1.0120021728794938e-05,
"loss": 0.2672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27014094591140747,
"step": 3055,
"valid_targets_mean": 6275.8,
"valid_targets_min": 2201
},
{
"epoch": 4.896,
"grad_norm": 0.4071136411439628,
"learning_rate": 1.0050720387001334e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24810561537742615,
"step": 3060,
"valid_targets_mean": 6389.0,
"valid_targets_min": 2924
},
{
"epoch": 4.904,
"grad_norm": 0.4038730028965521,
"learning_rate": 9.981577425078672e-06,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24336443841457367,
"step": 3065,
"valid_targets_mean": 5670.3,
"valid_targets_min": 740
},
{
"epoch": 4.912,
"grad_norm": 0.43517093885534663,
"learning_rate": 9.912593943694924e-06,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2760591506958008,
"step": 3070,
"valid_targets_mean": 5472.9,
"valid_targets_min": 783
},
{
"epoch": 4.92,
"grad_norm": 0.4227928570500053,
"learning_rate": 9.843771040979328e-06,
"loss": 0.2549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25480031967163086,
"step": 3075,
"valid_targets_mean": 6020.2,
"valid_targets_min": 2221
},
{
"epoch": 4.928,
"grad_norm": 0.4684683751640332,
"learning_rate": 9.775109812504922e-06,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2481108158826828,
"step": 3080,
"valid_targets_mean": 4860.8,
"valid_targets_min": 2502
},
{
"epoch": 4.936,
"grad_norm": 0.447379036311016,
"learning_rate": 9.706611351271088e-06,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2520700693130493,
"step": 3085,
"valid_targets_mean": 5130.7,
"valid_targets_min": 2504
},
{
"epoch": 4.944,
"grad_norm": 0.4383325246904605,
"learning_rate": 9.638276747686169e-06,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24543023109436035,
"step": 3090,
"valid_targets_mean": 5125.6,
"valid_targets_min": 2175
},
{
"epoch": 4.952,
"grad_norm": 0.4352567562200437,
"learning_rate": 9.570107089550091e-06,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2787247896194458,
"step": 3095,
"valid_targets_mean": 4917.8,
"valid_targets_min": 2301
},
{
"epoch": 4.96,
"grad_norm": 0.4604774036965585,
"learning_rate": 9.502103462037074e-06,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2525831460952759,
"step": 3100,
"valid_targets_mean": 5261.8,
"valid_targets_min": 1041
},
{
"epoch": 4.968,
"grad_norm": 0.37947111921277665,
"learning_rate": 9.434266947678326e-06,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2499474585056305,
"step": 3105,
"valid_targets_mean": 7018.6,
"valid_targets_min": 3738
},
{
"epoch": 4.976,
"grad_norm": 0.4605718602465518,
"learning_rate": 9.366598626344836e-06,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23395417630672455,
"step": 3110,
"valid_targets_mean": 4318.6,
"valid_targets_min": 918
},
{
"epoch": 4.984,
"grad_norm": 0.408558726874829,
"learning_rate": 9.299099575230172e-06,
"loss": 0.2729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.292435884475708,
"step": 3115,
"valid_targets_mean": 6323.2,
"valid_targets_min": 2397
},
{
"epoch": 4.992,
"grad_norm": 0.484634939648324,
"learning_rate": 9.231770868833334e-06,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2561487555503845,
"step": 3120,
"valid_targets_mean": 5338.1,
"valid_targets_min": 2595
},
{
"epoch": 5.0,
"grad_norm": 0.45839751766225767,
"learning_rate": 9.164613578941652e-06,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28931480646133423,
"step": 3125,
"valid_targets_mean": 4836.5,
"valid_targets_min": 428
},
{
"epoch": 5.008,
"grad_norm": 0.4182833320275383,
"learning_rate": 9.097628774613732e-06,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2569211721420288,
"step": 3130,
"valid_targets_mean": 5781.9,
"valid_targets_min": 2451
},
{
"epoch": 5.016,
"grad_norm": 0.4209600786624088,
"learning_rate": 9.030817522162403e-06,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2324075996875763,
"step": 3135,
"valid_targets_mean": 5339.5,
"valid_targets_min": 793
},
{
"epoch": 5.024,
"grad_norm": 0.44851688512328064,
"learning_rate": 8.964180885137797e-06,
"loss": 0.244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2408837378025055,
"step": 3140,
"valid_targets_mean": 5425.8,
"valid_targets_min": 2716
},
{
"epoch": 5.032,
"grad_norm": 0.484323206155298,
"learning_rate": 8.897719924310375e-06,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2470928132534027,
"step": 3145,
"valid_targets_mean": 4851.0,
"valid_targets_min": 627
},
{
"epoch": 5.04,
"grad_norm": 0.4623710689089007,
"learning_rate": 8.831435697654068e-06,
"loss": 0.2455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25896331667900085,
"step": 3150,
"valid_targets_mean": 5875.5,
"valid_targets_min": 1335
},
{
"epoch": 5.048,
"grad_norm": 0.4119943346269266,
"learning_rate": 8.765329260329413e-06,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26245784759521484,
"step": 3155,
"valid_targets_mean": 6056.2,
"valid_targets_min": 2070
},
{
"epoch": 5.056,
"grad_norm": 0.4107422408390761,
"learning_rate": 8.699401664666774e-06,
"loss": 0.2444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24972708523273468,
"step": 3160,
"valid_targets_mean": 6400.5,
"valid_targets_min": 784
},
{
"epoch": 5.064,
"grad_norm": 0.34537901545202443,
"learning_rate": 8.633653960149579e-06,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23936009407043457,
"step": 3165,
"valid_targets_mean": 7169.5,
"valid_targets_min": 1933
},
{
"epoch": 5.072,
"grad_norm": 0.44020015097063847,
"learning_rate": 8.56808719339762e-06,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26007118821144104,
"step": 3170,
"valid_targets_mean": 5437.1,
"valid_targets_min": 2662
},
{
"epoch": 5.08,
"grad_norm": 0.3670993210107219,
"learning_rate": 8.502702408150391e-06,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2242787927389145,
"step": 3175,
"valid_targets_mean": 6277.2,
"valid_targets_min": 2027
},
{
"epoch": 5.088,
"grad_norm": 0.4378221792589208,
"learning_rate": 8.43750064525047e-06,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22399312257766724,
"step": 3180,
"valid_targets_mean": 5389.4,
"valid_targets_min": 2389
},
{
"epoch": 5.096,
"grad_norm": 0.4892555740387963,
"learning_rate": 8.372482942626952e-06,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2311638444662094,
"step": 3185,
"valid_targets_mean": 4608.6,
"valid_targets_min": 1941
},
{
"epoch": 5.104,
"grad_norm": 0.4389530297089188,
"learning_rate": 8.307650335278927e-06,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2438417673110962,
"step": 3190,
"valid_targets_mean": 5221.5,
"valid_targets_min": 2204
},
{
"epoch": 5.112,
"grad_norm": 0.4447312980181925,
"learning_rate": 8.243003855259015e-06,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23452109098434448,
"step": 3195,
"valid_targets_mean": 4981.2,
"valid_targets_min": 2463
},
{
"epoch": 5.12,
"grad_norm": 0.43191387980796925,
"learning_rate": 8.178544531656897e-06,
"loss": 0.2511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2466181516647339,
"step": 3200,
"valid_targets_mean": 6129.1,
"valid_targets_min": 3720
},
{
"epoch": 5.128,
"grad_norm": 0.402538872085775,
"learning_rate": 8.11427339058299e-06,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25876384973526,
"step": 3205,
"valid_targets_mean": 6184.6,
"valid_targets_min": 1409
},
{
"epoch": 5.136,
"grad_norm": 0.4860220056729548,
"learning_rate": 8.050191455152072e-06,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2506711184978485,
"step": 3210,
"valid_targets_mean": 4799.5,
"valid_targets_min": 418
},
{
"epoch": 5.144,
"grad_norm": 0.48057095956799106,
"learning_rate": 7.986299745467013e-06,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25175127387046814,
"step": 3215,
"valid_targets_mean": 5248.0,
"valid_targets_min": 2555
},
{
"epoch": 5.152,
"grad_norm": 0.45862189357281363,
"learning_rate": 7.922599278602524e-06,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20885488390922546,
"step": 3220,
"valid_targets_mean": 4904.6,
"valid_targets_min": 2321
},
{
"epoch": 5.16,
"grad_norm": 0.41829998931400625,
"learning_rate": 7.859091068588987e-06,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23560893535614014,
"step": 3225,
"valid_targets_mean": 5652.8,
"valid_targets_min": 2067
},
{
"epoch": 5.168,
"grad_norm": 0.44356890901584595,
"learning_rate": 7.795776126396284e-06,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2722322344779968,
"step": 3230,
"valid_targets_mean": 5946.8,
"valid_targets_min": 2419
},
{
"epoch": 5.176,
"grad_norm": 0.4752087181203412,
"learning_rate": 7.732655459917726e-06,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.251334011554718,
"step": 3235,
"valid_targets_mean": 6202.1,
"valid_targets_min": 2143
},
{
"epoch": 5.184,
"grad_norm": 0.47330365224350573,
"learning_rate": 7.669730073954005e-06,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25445556640625,
"step": 3240,
"valid_targets_mean": 4800.8,
"valid_targets_min": 1979
},
{
"epoch": 5.192,
"grad_norm": 0.4241113042867172,
"learning_rate": 7.607000970197194e-06,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26085883378982544,
"step": 3245,
"valid_targets_mean": 6422.4,
"valid_targets_min": 3359
},
{
"epoch": 5.2,
"grad_norm": 0.4082829197550291,
"learning_rate": 7.544469147214797e-06,
"loss": 0.2435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23965823650360107,
"step": 3250,
"valid_targets_mean": 5750.3,
"valid_targets_min": 2589
},
{
"epoch": 5.208,
"grad_norm": 0.4212938893338529,
"learning_rate": 7.482135600433868e-06,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2490275353193283,
"step": 3255,
"valid_targets_mean": 5702.0,
"valid_targets_min": 1607
},
{
"epoch": 5.216,
"grad_norm": 0.4533089451122526,
"learning_rate": 7.420001322125156e-06,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26186293363571167,
"step": 3260,
"valid_targets_mean": 5979.9,
"valid_targets_min": 965
},
{
"epoch": 5.224,
"grad_norm": 0.43280208998225644,
"learning_rate": 7.3580673013872946e-06,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2600148320198059,
"step": 3265,
"valid_targets_mean": 5992.2,
"valid_targets_min": 2637
},
{
"epoch": 5.232,
"grad_norm": 0.4285996875181488,
"learning_rate": 7.2963345241310904e-06,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24552065134048462,
"step": 3270,
"valid_targets_mean": 5952.8,
"valid_targets_min": 2993
},
{
"epoch": 5.24,
"grad_norm": 0.4396851695342125,
"learning_rate": 7.234803973063797e-06,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2468017339706421,
"step": 3275,
"valid_targets_mean": 5339.3,
"valid_targets_min": 2045
},
{
"epoch": 5.248,
"grad_norm": 0.46885707206768734,
"learning_rate": 7.173476627673492e-06,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23570626974105835,
"step": 3280,
"valid_targets_mean": 4740.2,
"valid_targets_min": 895
},
{
"epoch": 5.256,
"grad_norm": 0.47683292662936794,
"learning_rate": 7.112353464213477e-06,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23079991340637207,
"step": 3285,
"valid_targets_mean": 4879.6,
"valid_targets_min": 781
},
{
"epoch": 5.264,
"grad_norm": 0.40296099845402256,
"learning_rate": 7.051435455686735e-06,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24319109320640564,
"step": 3290,
"valid_targets_mean": 6255.1,
"valid_targets_min": 2817
},
{
"epoch": 5.272,
"grad_norm": 0.4469612736416828,
"learning_rate": 6.990723571830438e-06,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24624331295490265,
"step": 3295,
"valid_targets_mean": 5637.4,
"valid_targets_min": 1883
},
{
"epoch": 5.28,
"grad_norm": 0.39280133547463153,
"learning_rate": 6.93021877910052e-06,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2591555118560791,
"step": 3300,
"valid_targets_mean": 6686.6,
"valid_targets_min": 2720
},
{
"epoch": 5.288,
"grad_norm": 0.4258546217009564,
"learning_rate": 6.8699220406562985e-06,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24424447119235992,
"step": 3305,
"valid_targets_mean": 6241.3,
"valid_targets_min": 3838
},
{
"epoch": 5.296,
"grad_norm": 0.4385890742807229,
"learning_rate": 6.809834316345117e-06,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24113088846206665,
"step": 3310,
"valid_targets_mean": 5023.6,
"valid_targets_min": 3535
},
{
"epoch": 5.304,
"grad_norm": 0.43825408254424714,
"learning_rate": 6.749956562687083e-06,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31159403920173645,
"step": 3315,
"valid_targets_mean": 6687.9,
"valid_targets_min": 608
},
{
"epoch": 5.312,
"grad_norm": 0.4433569916218975,
"learning_rate": 6.690289732859841e-06,
"loss": 0.2543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28443658351898193,
"step": 3320,
"valid_targets_mean": 6012.2,
"valid_targets_min": 2471
},
{
"epoch": 5.32,
"grad_norm": 0.3949199572235783,
"learning_rate": 6.630834776683403e-06,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26501333713531494,
"step": 3325,
"valid_targets_mean": 6522.0,
"valid_targets_min": 1666
},
{
"epoch": 5.328,
"grad_norm": 0.4111723604366614,
"learning_rate": 6.571592640605e-06,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23842376470565796,
"step": 3330,
"valid_targets_mean": 6088.6,
"valid_targets_min": 3261
},
{
"epoch": 5.336,
"grad_norm": 0.4018640109418417,
"learning_rate": 6.512564267684061e-06,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24280548095703125,
"step": 3335,
"valid_targets_mean": 6272.4,
"valid_targets_min": 783
},
{
"epoch": 5.344,
"grad_norm": 0.399544016875131,
"learning_rate": 6.453750597577167e-06,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.284124493598938,
"step": 3340,
"valid_targets_mean": 6603.8,
"valid_targets_min": 2776
},
{
"epoch": 5.352,
"grad_norm": 0.39745798572137775,
"learning_rate": 6.395152566523106e-06,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24532105028629303,
"step": 3345,
"valid_targets_mean": 5812.2,
"valid_targets_min": 818
},
{
"epoch": 5.36,
"grad_norm": 0.46784958899372814,
"learning_rate": 6.336771107327966e-06,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2436250001192093,
"step": 3350,
"valid_targets_mean": 5234.5,
"valid_targets_min": 619
},
{
"epoch": 5.368,
"grad_norm": 0.45098215369867023,
"learning_rate": 6.278607149350289e-06,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25613322854042053,
"step": 3355,
"valid_targets_mean": 5455.2,
"valid_targets_min": 2360
},
{
"epoch": 5.376,
"grad_norm": 0.43942856625352117,
"learning_rate": 6.220661618486268e-06,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24000336229801178,
"step": 3360,
"valid_targets_mean": 5367.2,
"valid_targets_min": 1183
},
{
"epoch": 5.384,
"grad_norm": 0.4523399589569011,
"learning_rate": 6.162935437155024e-06,
"loss": 0.2509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24709078669548035,
"step": 3365,
"valid_targets_mean": 5741.4,
"valid_targets_min": 2570
},
{
"epoch": 5.392,
"grad_norm": 0.4708562307010389,
"learning_rate": 6.105429524283901e-06,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23900192975997925,
"step": 3370,
"valid_targets_mean": 4828.1,
"valid_targets_min": 1988
},
{
"epoch": 5.4,
"grad_norm": 0.381020756607991,
"learning_rate": 6.04814479529386e-06,
"loss": 0.2412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2541239261627197,
"step": 3375,
"valid_targets_mean": 6797.5,
"valid_targets_min": 3085
},
{
"epoch": 5.408,
"grad_norm": 0.46455582913065613,
"learning_rate": 5.991082162084889e-06,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2606612741947174,
"step": 3380,
"valid_targets_mean": 5196.4,
"valid_targets_min": 1907
},
{
"epoch": 5.416,
"grad_norm": 0.4388471193782842,
"learning_rate": 5.934242533021499e-06,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2463933527469635,
"step": 3385,
"valid_targets_mean": 5517.2,
"valid_targets_min": 2367
},
{
"epoch": 5.424,
"grad_norm": 0.42373863816522317,
"learning_rate": 5.877626812918258e-06,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2637603282928467,
"step": 3390,
"valid_targets_mean": 6460.0,
"valid_targets_min": 2931
},
{
"epoch": 5.432,
"grad_norm": 0.42564288561284036,
"learning_rate": 5.821235903025378e-06,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23866936564445496,
"step": 3395,
"valid_targets_mean": 5335.6,
"valid_targets_min": 2272
},
{
"epoch": 5.44,
"grad_norm": 0.4223958250211236,
"learning_rate": 5.765070701014391e-06,
"loss": 0.2466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2407655119895935,
"step": 3400,
"valid_targets_mean": 5698.6,
"valid_targets_min": 1173
},
{
"epoch": 5.448,
"grad_norm": 0.4363438815869388,
"learning_rate": 5.709132100963841e-06,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24764753878116608,
"step": 3405,
"valid_targets_mean": 5587.6,
"valid_targets_min": 1994
},
{
"epoch": 5.456,
"grad_norm": 0.4265485440426739,
"learning_rate": 5.653420993345062e-06,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25707298517227173,
"step": 3410,
"valid_targets_mean": 5705.9,
"valid_targets_min": 1607
},
{
"epoch": 5.464,
"grad_norm": 0.42927725568540487,
"learning_rate": 5.597938265007994e-06,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2565683126449585,
"step": 3415,
"valid_targets_mean": 5731.8,
"valid_targets_min": 763
},
{
"epoch": 5.4719999999999995,
"grad_norm": 0.42083810722984627,
"learning_rate": 5.542684799167069e-06,
"loss": 0.2517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2680370807647705,
"step": 3420,
"valid_targets_mean": 5880.8,
"valid_targets_min": 2995
},
{
"epoch": 5.48,
"grad_norm": 0.397286313684561,
"learning_rate": 5.487661475387152e-06,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2509041726589203,
"step": 3425,
"valid_targets_mean": 6285.8,
"valid_targets_min": 1872
},
{
"epoch": 5.4879999999999995,
"grad_norm": 0.4187203152823719,
"learning_rate": 5.432869169569541e-06,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23192846775054932,
"step": 3430,
"valid_targets_mean": 5728.9,
"valid_targets_min": 2062
},
{
"epoch": 5.496,
"grad_norm": 0.4240392250819973,
"learning_rate": 5.378308753938024e-06,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23642998933792114,
"step": 3435,
"valid_targets_mean": 5666.9,
"valid_targets_min": 2092
},
{
"epoch": 5.504,
"grad_norm": 0.45571623112464904,
"learning_rate": 5.323981097024986e-06,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24621962010860443,
"step": 3440,
"valid_targets_mean": 5369.1,
"valid_targets_min": 2968
},
{
"epoch": 5.5120000000000005,
"grad_norm": 0.43171822203395027,
"learning_rate": 5.269887063657595e-06,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2391555905342102,
"step": 3445,
"valid_targets_mean": 5589.8,
"valid_targets_min": 907
},
{
"epoch": 5.52,
"grad_norm": 0.4275681474717406,
"learning_rate": 5.216027514944027e-06,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24127346277236938,
"step": 3450,
"valid_targets_mean": 5519.3,
"valid_targets_min": 1018
},
{
"epoch": 5.5280000000000005,
"grad_norm": 0.41944732345815783,
"learning_rate": 5.162403308259767e-06,
"loss": 0.2491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24043628573417664,
"step": 3455,
"valid_targets_mean": 6375.5,
"valid_targets_min": 3478
},
{
"epoch": 5.536,
"grad_norm": 0.43002550469332923,
"learning_rate": 5.109015297233935e-06,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23204442858695984,
"step": 3460,
"valid_targets_mean": 5087.3,
"valid_targets_min": 901
},
{
"epoch": 5.5440000000000005,
"grad_norm": 0.4431970324561754,
"learning_rate": 5.055864331735736e-06,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24048209190368652,
"step": 3465,
"valid_targets_mean": 5482.9,
"valid_targets_min": 1870
},
{
"epoch": 5.552,
"grad_norm": 0.3920844129704998,
"learning_rate": 5.002951257860909e-06,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24493908882141113,
"step": 3470,
"valid_targets_mean": 6554.7,
"valid_targets_min": 2038
},
{
"epoch": 5.5600000000000005,
"grad_norm": 0.4181462899118393,
"learning_rate": 4.950276917918256e-06,
"loss": 0.2393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24973033368587494,
"step": 3475,
"valid_targets_mean": 5991.9,
"valid_targets_min": 3047
},
{
"epoch": 5.568,
"grad_norm": 0.45794713136570736,
"learning_rate": 4.8978421504162385e-06,
"loss": 0.2466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23978012800216675,
"step": 3480,
"valid_targets_mean": 4957.3,
"valid_targets_min": 2608
},
{
"epoch": 5.576,
"grad_norm": 0.3923396821974702,
"learning_rate": 4.845647790049634e-06,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23957261443138123,
"step": 3485,
"valid_targets_mean": 6061.6,
"valid_targets_min": 2531
},
{
"epoch": 5.584,
"grad_norm": 0.4800708463038158,
"learning_rate": 4.793694667686244e-06,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2572818398475647,
"step": 3490,
"valid_targets_mean": 5308.6,
"valid_targets_min": 687
},
{
"epoch": 5.592,
"grad_norm": 0.4109993468120257,
"learning_rate": 4.741983610353664e-06,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21713688969612122,
"step": 3495,
"valid_targets_mean": 5530.6,
"valid_targets_min": 2402
},
{
"epoch": 5.6,
"grad_norm": 0.4372650094791484,
"learning_rate": 4.690515441226122e-06,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23960278928279877,
"step": 3500,
"valid_targets_mean": 5337.7,
"valid_targets_min": 1942
},
{
"epoch": 5.608,
"grad_norm": 0.46819765052374257,
"learning_rate": 4.639290979611379e-06,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22429856657981873,
"step": 3505,
"valid_targets_mean": 4855.4,
"valid_targets_min": 2284
},
{
"epoch": 5.616,
"grad_norm": 0.4041069980782639,
"learning_rate": 4.588311040937683e-06,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2593272924423218,
"step": 3510,
"valid_targets_mean": 6654.3,
"valid_targets_min": 4808
},
{
"epoch": 5.624,
"grad_norm": 0.44503285983742874,
"learning_rate": 4.537576436740783e-06,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24970743060112,
"step": 3515,
"valid_targets_mean": 5985.1,
"valid_targets_min": 2545
},
{
"epoch": 5.632,
"grad_norm": 0.4717360114114379,
"learning_rate": 4.487087974651016e-06,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23342707753181458,
"step": 3520,
"valid_targets_mean": 4694.1,
"valid_targets_min": 2567
},
{
"epoch": 5.64,
"grad_norm": 0.4706677633097796,
"learning_rate": 4.436846458380455e-06,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2343820333480835,
"step": 3525,
"valid_targets_mean": 4799.3,
"valid_targets_min": 876
},
{
"epoch": 5.648,
"grad_norm": 0.41331820998430824,
"learning_rate": 4.386852687710104e-06,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2305280566215515,
"step": 3530,
"valid_targets_mean": 5371.6,
"valid_targets_min": 2276
},
{
"epoch": 5.656,
"grad_norm": 0.43830938492589083,
"learning_rate": 4.337107458477177e-06,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2581741213798523,
"step": 3535,
"valid_targets_mean": 5969.8,
"valid_targets_min": 3700
},
{
"epoch": 5.664,
"grad_norm": 0.39718001494210303,
"learning_rate": 4.287611562562422e-06,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2551124393939972,
"step": 3540,
"valid_targets_mean": 6743.6,
"valid_targets_min": 2610
},
{
"epoch": 5.672,
"grad_norm": 0.47799147623395644,
"learning_rate": 4.238365787877516e-06,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2615952491760254,
"step": 3545,
"valid_targets_mean": 5030.4,
"valid_targets_min": 2079
},
{
"epoch": 5.68,
"grad_norm": 0.43097924186117664,
"learning_rate": 4.189370918352531e-06,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23403191566467285,
"step": 3550,
"valid_targets_mean": 5988.9,
"valid_targets_min": 2722
},
{
"epoch": 5.688,
"grad_norm": 0.43364358762558836,
"learning_rate": 4.140627733923439e-06,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24536678194999695,
"step": 3555,
"valid_targets_mean": 5547.0,
"valid_targets_min": 2828
},
{
"epoch": 5.696,
"grad_norm": 0.380117459617515,
"learning_rate": 4.092137010519712e-06,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2651956081390381,
"step": 3560,
"valid_targets_mean": 6673.7,
"valid_targets_min": 2056
},
{
"epoch": 5.704,
"grad_norm": 0.37672052137731615,
"learning_rate": 4.043899520051964e-06,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2500587999820709,
"step": 3565,
"valid_targets_mean": 6525.6,
"valid_targets_min": 1040
},
{
"epoch": 5.712,
"grad_norm": 0.42491726304200406,
"learning_rate": 3.995916030399658e-06,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2274150550365448,
"step": 3570,
"valid_targets_mean": 5182.4,
"valid_targets_min": 699
},
{
"epoch": 5.72,
"grad_norm": 0.42850700678468717,
"learning_rate": 3.948187305398892e-06,
"loss": 0.25,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2219313681125641,
"step": 3575,
"valid_targets_mean": 5911.5,
"valid_targets_min": 2882
},
{
"epoch": 5.728,
"grad_norm": 0.44052850311666414,
"learning_rate": 3.90071410483023e-06,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25418415665626526,
"step": 3580,
"valid_targets_mean": 5418.7,
"valid_targets_min": 1666
},
{
"epoch": 5.736,
"grad_norm": 0.43430539148105113,
"learning_rate": 3.853497184406623e-06,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542496919631958,
"step": 3585,
"valid_targets_mean": 5782.9,
"valid_targets_min": 2622
},
{
"epoch": 5.744,
"grad_norm": 0.4378276109822209,
"learning_rate": 3.80653729576135e-06,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23649832606315613,
"step": 3590,
"valid_targets_mean": 5274.5,
"valid_targets_min": 2480
},
{
"epoch": 5.752,
"grad_norm": 0.4762535210324838,
"learning_rate": 3.7598351864360872e-06,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23490282893180847,
"step": 3595,
"valid_targets_mean": 4631.4,
"valid_targets_min": 802
},
{
"epoch": 5.76,
"grad_norm": 0.4509017959893099,
"learning_rate": 3.713391599868985e-06,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23814690113067627,
"step": 3600,
"valid_targets_mean": 5169.4,
"valid_targets_min": 740
},
{
"epoch": 5.768,
"grad_norm": 0.4171862673978773,
"learning_rate": 3.6672072753828424e-06,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2462296038866043,
"step": 3605,
"valid_targets_mean": 5297.6,
"valid_targets_min": 1668
},
{
"epoch": 5.776,
"grad_norm": 0.4256809301759758,
"learning_rate": 3.6212829481733368e-06,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24445554614067078,
"step": 3610,
"valid_targets_mean": 5463.2,
"valid_targets_min": 2316
},
{
"epoch": 5.784,
"grad_norm": 0.4167025170439137,
"learning_rate": 3.575619349297317e-06,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21641194820404053,
"step": 3615,
"valid_targets_mean": 5376.2,
"valid_targets_min": 533
},
{
"epoch": 5.792,
"grad_norm": 0.4206073504201526,
"learning_rate": 3.5302172056611682e-06,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27774128317832947,
"step": 3620,
"valid_targets_mean": 6891.8,
"valid_targets_min": 740
},
{
"epoch": 5.8,
"grad_norm": 0.4575929196736855,
"learning_rate": 3.485077240009247e-06,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605830132961273,
"step": 3625,
"valid_targets_mean": 5522.7,
"valid_targets_min": 761
},
{
"epoch": 5.808,
"grad_norm": 0.461225529092125,
"learning_rate": 3.4402001709123643e-06,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2431730031967163,
"step": 3630,
"valid_targets_mean": 5088.9,
"valid_targets_min": 2248
},
{
"epoch": 5.816,
"grad_norm": 0.4126669360245022,
"learning_rate": 3.3955867127563515e-06,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25011661648750305,
"step": 3635,
"valid_targets_mean": 6407.1,
"valid_targets_min": 2470
},
{
"epoch": 5.824,
"grad_norm": 0.4448568564700826,
"learning_rate": 3.351237575730695e-06,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2398379147052765,
"step": 3640,
"valid_targets_mean": 5172.5,
"valid_targets_min": 798
},
{
"epoch": 5.832,
"grad_norm": 0.4143753113371597,
"learning_rate": 3.307153465817219e-06,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23666608333587646,
"step": 3645,
"valid_targets_mean": 5480.1,
"valid_targets_min": 2095
},
{
"epoch": 5.84,
"grad_norm": 0.4753065577157038,
"learning_rate": 3.263335084778856e-06,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26486414670944214,
"step": 3650,
"valid_targets_mean": 5145.8,
"valid_targets_min": 532
},
{
"epoch": 5.848,
"grad_norm": 0.4785539397504414,
"learning_rate": 3.2197831301484816e-06,
"loss": 0.2506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2624918818473816,
"step": 3655,
"valid_targets_mean": 5236.1,
"valid_targets_min": 704
},
{
"epoch": 5.856,
"grad_norm": 0.43901540322621985,
"learning_rate": 3.1764982952177805e-06,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.253711462020874,
"step": 3660,
"valid_targets_mean": 6207.4,
"valid_targets_min": 3493
},
{
"epoch": 5.864,
"grad_norm": 0.46334079040298753,
"learning_rate": 3.1334812690262507e-06,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2284860759973526,
"step": 3665,
"valid_targets_mean": 4962.0,
"valid_targets_min": 1970
},
{
"epoch": 5.872,
"grad_norm": 0.41129202818307,
"learning_rate": 3.0907327363502084e-06,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24177731573581696,
"step": 3670,
"valid_targets_mean": 5679.8,
"valid_targets_min": 2740
},
{
"epoch": 5.88,
"grad_norm": 0.4405933411516817,
"learning_rate": 3.0482533776918987e-06,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2584155201911926,
"step": 3675,
"valid_targets_mean": 5422.5,
"valid_targets_min": 2514
},
{
"epoch": 5.888,
"grad_norm": 0.38587475298350843,
"learning_rate": 3.0060438692686533e-06,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2485569566488266,
"step": 3680,
"valid_targets_mean": 6428.7,
"valid_targets_min": 2191
},
{
"epoch": 5.896,
"grad_norm": 0.4507232955476526,
"learning_rate": 2.964104883002139e-06,
"loss": 0.2395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26484763622283936,
"step": 3685,
"valid_targets_mean": 5712.8,
"valid_targets_min": 2328
},
{
"epoch": 5.904,
"grad_norm": 0.43487093323288945,
"learning_rate": 2.9224370865076457e-06,
"loss": 0.2475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25088346004486084,
"step": 3690,
"valid_targets_mean": 5280.4,
"valid_targets_min": 2833
},
{
"epoch": 5.912,
"grad_norm": 0.46366305358427945,
"learning_rate": 2.8810411430834716e-06,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23430442810058594,
"step": 3695,
"valid_targets_mean": 4903.6,
"valid_targets_min": 2845
},
{
"epoch": 5.92,
"grad_norm": 0.45953163223662696,
"learning_rate": 2.8399177117003595e-06,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21741312742233276,
"step": 3700,
"valid_targets_mean": 4953.9,
"valid_targets_min": 524
},
{
"epoch": 5.928,
"grad_norm": 0.39124968173123453,
"learning_rate": 2.7990674469910085e-06,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2448250949382782,
"step": 3705,
"valid_targets_mean": 6150.7,
"valid_targets_min": 2248
},
{
"epoch": 5.936,
"grad_norm": 0.35502781214246365,
"learning_rate": 2.7584909992396515e-06,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26683682203292847,
"step": 3710,
"valid_targets_mean": 7718.4,
"valid_targets_min": 3037
},
{
"epoch": 5.944,
"grad_norm": 0.39446290087026825,
"learning_rate": 2.7181890143716995e-06,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26290997862815857,
"step": 3715,
"valid_targets_mean": 6427.1,
"valid_targets_min": 3224
},
{
"epoch": 5.952,
"grad_norm": 0.47638170497550425,
"learning_rate": 2.6781621339434717e-06,
"loss": 0.2401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23213085532188416,
"step": 3720,
"valid_targets_mean": 4806.5,
"valid_targets_min": 647
},
{
"epoch": 5.96,
"grad_norm": 0.4267363318221976,
"learning_rate": 2.638410995131966e-06,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26729530096054077,
"step": 3725,
"valid_targets_mean": 5881.9,
"valid_targets_min": 2237
},
{
"epoch": 5.968,
"grad_norm": 0.4179471638601527,
"learning_rate": 2.5989362307247313e-06,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26390784978866577,
"step": 3730,
"valid_targets_mean": 6047.1,
"valid_targets_min": 3510
},
{
"epoch": 5.976,
"grad_norm": 0.40078466530949025,
"learning_rate": 2.5597384691097847e-06,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24570685625076294,
"step": 3735,
"valid_targets_mean": 6009.8,
"valid_targets_min": 707
},
{
"epoch": 5.984,
"grad_norm": 0.4225593036828595,
"learning_rate": 2.520818334265611e-06,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25478851795196533,
"step": 3740,
"valid_targets_mean": 5721.6,
"valid_targets_min": 3165
},
{
"epoch": 5.992,
"grad_norm": 0.44828897669175494,
"learning_rate": 2.482176445751232e-06,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24662527441978455,
"step": 3745,
"valid_targets_mean": 5301.8,
"valid_targets_min": 1841
},
{
"epoch": 6.0,
"grad_norm": 0.424666922649159,
"learning_rate": 2.4438134186963415e-06,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27201324701309204,
"step": 3750,
"valid_targets_mean": 5872.3,
"valid_targets_min": 2475
},
{
"epoch": 6.008,
"grad_norm": 0.45619535275351364,
"learning_rate": 2.4057298637915105e-06,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2112616002559662,
"step": 3755,
"valid_targets_mean": 4857.0,
"valid_targets_min": 2365
},
{
"epoch": 6.016,
"grad_norm": 0.4367115638555302,
"learning_rate": 2.3679263872784717e-06,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25617077946662903,
"step": 3760,
"valid_targets_mean": 4926.6,
"valid_targets_min": 273
},
{
"epoch": 6.024,
"grad_norm": 0.45303009142719136,
"learning_rate": 2.330403590940471e-06,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3148558735847473,
"step": 3765,
"valid_targets_mean": 6289.8,
"valid_targets_min": 988
},
{
"epoch": 6.032,
"grad_norm": 0.42543736613890915,
"learning_rate": 2.2931620720926717e-06,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2525025010108948,
"step": 3770,
"valid_targets_mean": 5580.8,
"valid_targets_min": 2635
},
{
"epoch": 6.04,
"grad_norm": 0.4352315343427995,
"learning_rate": 2.256202423572669e-06,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24089187383651733,
"step": 3775,
"valid_targets_mean": 5376.5,
"valid_targets_min": 598
},
{
"epoch": 6.048,
"grad_norm": 0.430712579222173,
"learning_rate": 2.219525233731035e-06,
"loss": 0.2395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24066440761089325,
"step": 3780,
"valid_targets_mean": 5657.6,
"valid_targets_min": 859
},
{
"epoch": 6.056,
"grad_norm": 0.4785332476153452,
"learning_rate": 2.183131086421961e-06,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2637433409690857,
"step": 3785,
"valid_targets_mean": 5608.4,
"valid_targets_min": 3189
},
{
"epoch": 6.064,
"grad_norm": 0.4750185463565966,
"learning_rate": 2.1470205609939533e-06,
"loss": 0.2412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24166584014892578,
"step": 3790,
"valid_targets_mean": 5490.9,
"valid_targets_min": 2950
},
{
"epoch": 6.072,
"grad_norm": 0.3827437754884297,
"learning_rate": 2.1111942322806335e-06,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24897339940071106,
"step": 3795,
"valid_targets_mean": 6231.8,
"valid_targets_min": 2760
},
{
"epoch": 6.08,
"grad_norm": 0.3816212526244572,
"learning_rate": 2.0756526705915635e-06,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28404420614242554,
"step": 3800,
"valid_targets_mean": 7391.5,
"valid_targets_min": 4361
},
{
"epoch": 6.088,
"grad_norm": 0.45028360119094746,
"learning_rate": 2.0403964417031764e-06,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22149428725242615,
"step": 3805,
"valid_targets_mean": 4898.4,
"valid_targets_min": 2070
},
{
"epoch": 6.096,
"grad_norm": 0.4285819585903812,
"learning_rate": 2.0054261068497773e-06,
"loss": 0.2422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23075240850448608,
"step": 3810,
"valid_targets_mean": 5468.2,
"valid_targets_min": 2258
},
{
"epoch": 6.104,
"grad_norm": 0.40077819783213,
"learning_rate": 1.9707422227145922e-06,
"loss": 0.2422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23339712619781494,
"step": 3815,
"valid_targets_mean": 6263.2,
"valid_targets_min": 676
},
{
"epoch": 6.112,
"grad_norm": 0.4548643615766851,
"learning_rate": 1.936345341420924e-06,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2526797652244568,
"step": 3820,
"valid_targets_mean": 5243.7,
"valid_targets_min": 1971
},
{
"epoch": 6.12,
"grad_norm": 0.4318025930934668,
"learning_rate": 1.9022360105233507e-06,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24329990148544312,
"step": 3825,
"valid_targets_mean": 5584.3,
"valid_targets_min": 2735
},
{
"epoch": 6.128,
"grad_norm": 0.42527366921476684,
"learning_rate": 1.8684147729990188e-06,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2661643326282501,
"step": 3830,
"valid_targets_mean": 5815.2,
"valid_targets_min": 2130
},
{
"epoch": 6.136,
"grad_norm": 0.46563230810045014,
"learning_rate": 1.8348821672389893e-06,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23695829510688782,
"step": 3835,
"valid_targets_mean": 4932.8,
"valid_targets_min": 721
},
{
"epoch": 6.144,
"grad_norm": 0.49593615366135946,
"learning_rate": 1.8016387270396784e-06,
"loss": 0.2523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24340695142745972,
"step": 3840,
"valid_targets_mean": 4821.8,
"valid_targets_min": 1607
},
{
"epoch": 6.152,
"grad_norm": 0.4101378057435764,
"learning_rate": 1.7686849815943486e-06,
"loss": 0.2361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23768271505832672,
"step": 3845,
"valid_targets_mean": 5658.8,
"valid_targets_min": 1018
},
{
"epoch": 6.16,
"grad_norm": 0.40398041857114947,
"learning_rate": 1.7360214554847e-06,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2318260818719864,
"step": 3850,
"valid_targets_mean": 5986.0,
"valid_targets_min": 1597
},
{
"epoch": 6.168,
"grad_norm": 0.3896245352440973,
"learning_rate": 1.703648668672495e-06,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25532662868499756,
"step": 3855,
"valid_targets_mean": 6799.4,
"valid_targets_min": 4356
},
{
"epoch": 6.176,
"grad_norm": 0.47023459730054107,
"learning_rate": 1.6715671364913077e-06,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25101006031036377,
"step": 3860,
"valid_targets_mean": 5093.5,
"valid_targets_min": 2197
},
{
"epoch": 6.184,
"grad_norm": 0.4725640485374112,
"learning_rate": 1.6397773696383091e-06,
"loss": 0.2444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.261438250541687,
"step": 3865,
"valid_targets_mean": 5164.5,
"valid_targets_min": 2718
},
{
"epoch": 6.192,
"grad_norm": 0.3777763013538414,
"learning_rate": 1.6082798741661321e-06,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24589067697525024,
"step": 3870,
"valid_targets_mean": 6304.3,
"valid_targets_min": 2316
},
{
"epoch": 6.2,
"grad_norm": 0.4141398897239025,
"learning_rate": 1.5770751514748273e-06,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2230231761932373,
"step": 3875,
"valid_targets_mean": 6024.8,
"valid_targets_min": 2746
},
{
"epoch": 6.208,
"grad_norm": 0.5268906276378791,
"learning_rate": 1.5461636983038686e-06,
"loss": 0.237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20659932494163513,
"step": 3880,
"valid_targets_mean": 4485.9,
"valid_targets_min": 746
},
{
"epoch": 6.216,
"grad_norm": 0.4538584693912728,
"learning_rate": 1.5155460067242578e-06,
"loss": 0.2451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24113240838050842,
"step": 3885,
"valid_targets_mean": 5059.6,
"valid_targets_min": 2210
},
{
"epoch": 6.224,
"grad_norm": 0.4186097232034136,
"learning_rate": 1.4852225641306816e-06,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23600910604000092,
"step": 3890,
"valid_targets_mean": 5368.4,
"valid_targets_min": 2607
},
{
"epoch": 6.232,
"grad_norm": 0.39080225059366364,
"learning_rate": 1.4551938532337607e-06,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22949565947055817,
"step": 3895,
"valid_targets_mean": 6097.4,
"valid_targets_min": 2321
},
{
"epoch": 6.24,
"grad_norm": 0.40327121453751646,
"learning_rate": 1.4254603520523614e-06,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2395782172679901,
"step": 3900,
"valid_targets_mean": 5384.2,
"valid_targets_min": 1669
},
{
"epoch": 6.248,
"grad_norm": 0.46323326452197255,
"learning_rate": 1.3960225339059875e-06,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2367008924484253,
"step": 3905,
"valid_targets_mean": 4857.9,
"valid_targets_min": 2263
},
{
"epoch": 6.256,
"grad_norm": 0.4669508465968655,
"learning_rate": 1.3668808674072409e-06,
"loss": 0.2475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24488641321659088,
"step": 3910,
"valid_targets_mean": 5089.0,
"valid_targets_min": 607
},
{
"epoch": 6.264,
"grad_norm": 0.4185297696425607,
"learning_rate": 1.338035816454375e-06,
"loss": 0.2652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2515830993652344,
"step": 3915,
"valid_targets_mean": 6029.6,
"valid_targets_min": 548
},
{
"epoch": 6.272,
"grad_norm": 0.38594773761023776,
"learning_rate": 1.3094878402238887e-06,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24694006145000458,
"step": 3920,
"valid_targets_mean": 6196.4,
"valid_targets_min": 2614
},
{
"epoch": 6.28,
"grad_norm": 0.47584759172344404,
"learning_rate": 1.2812373931632371e-06,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2393854856491089,
"step": 3925,
"valid_targets_mean": 4695.4,
"valid_targets_min": 2014
},
{
"epoch": 6.288,
"grad_norm": 0.39590185736913047,
"learning_rate": 1.2532849249835932e-06,
"loss": 0.2406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2512339949607849,
"step": 3930,
"valid_targets_mean": 6472.1,
"valid_targets_min": 2398
},
{
"epoch": 6.296,
"grad_norm": 0.37945048971948964,
"learning_rate": 1.2256308806526774e-06,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25047585368156433,
"step": 3935,
"valid_targets_mean": 6452.8,
"valid_targets_min": 1215
},
{
"epoch": 6.304,
"grad_norm": 0.4387172990204296,
"learning_rate": 1.1982757003876855e-06,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23491425812244415,
"step": 3940,
"valid_targets_mean": 5545.7,
"valid_targets_min": 885
},
{
"epoch": 6.312,
"grad_norm": 0.4469901316225646,
"learning_rate": 1.1712198196482793e-06,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23085957765579224,
"step": 3945,
"valid_targets_mean": 5547.8,
"valid_targets_min": 3023
},
{
"epoch": 6.32,
"grad_norm": 0.4603135179912558,
"learning_rate": 1.1444636691296518e-06,
"loss": 0.2379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24019691348075867,
"step": 3950,
"valid_targets_mean": 4919.2,
"valid_targets_min": 724
},
{
"epoch": 6.328,
"grad_norm": 0.4438177637134314,
"learning_rate": 1.11800767475567e-06,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2676534652709961,
"step": 3955,
"valid_targets_mean": 5193.1,
"valid_targets_min": 920
},
{
"epoch": 6.336,
"grad_norm": 0.4199267913461744,
"learning_rate": 1.0918522576721014e-06,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24460649490356445,
"step": 3960,
"valid_targets_mean": 5347.7,
"valid_targets_min": 763
},
{
"epoch": 6.344,
"grad_norm": 0.4948993768878234,
"learning_rate": 1.0659978342399003e-06,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27012935280799866,
"step": 3965,
"valid_targets_mean": 4998.6,
"valid_targets_min": 2627
},
{
"epoch": 6.352,
"grad_norm": 0.4098695529895006,
"learning_rate": 1.0404448160285897e-06,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2442832738161087,
"step": 3970,
"valid_targets_mean": 6394.7,
"valid_targets_min": 2311
},
{
"epoch": 6.36,
"grad_norm": 0.4346467043954532,
"learning_rate": 1.0151936098097015e-06,
"loss": 0.2533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26824837923049927,
"step": 3975,
"valid_targets_mean": 5873.1,
"valid_targets_min": 2276
},
{
"epoch": 6.368,
"grad_norm": 0.4513988008025312,
"learning_rate": 9.902446175503089e-07,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2434309720993042,
"step": 3980,
"valid_targets_mean": 5546.4,
"valid_targets_min": 1814
},
{
"epoch": 6.376,
"grad_norm": 0.41241583616978356,
"learning_rate": 9.655982364066197e-07,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2734718322753906,
"step": 3985,
"valid_targets_mean": 6247.4,
"valid_targets_min": 3358
},
{
"epoch": 6.384,
"grad_norm": 0.5047686747359263,
"learning_rate": 9.412548587176595e-07,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22194236516952515,
"step": 3990,
"valid_targets_mean": 5368.3,
"valid_targets_min": 2132
},
{
"epoch": 6.392,
"grad_norm": 0.44151918846121585,
"learning_rate": 9.172148719990237e-07,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2182375192642212,
"step": 3995,
"valid_targets_mean": 4883.4,
"valid_targets_min": 742
},
{
"epoch": 6.4,
"grad_norm": 0.41520968471331116,
"learning_rate": 8.934786589367106e-07,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22132691740989685,
"step": 4000,
"valid_targets_mean": 5478.4,
"valid_targets_min": 913
},
{
"epoch": 6.408,
"grad_norm": 0.48850525017353114,
"learning_rate": 8.700465973810246e-07,
"loss": 0.2444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22604086995124817,
"step": 4005,
"valid_targets_mean": 4439.8,
"valid_targets_min": 647
},
{
"epoch": 6.416,
"grad_norm": 0.47475359432399017,
"learning_rate": 8.469190603405719e-07,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.260003924369812,
"step": 4010,
"valid_targets_mean": 5379.8,
"valid_targets_min": 862
},
{
"epoch": 6.424,
"grad_norm": 0.4224315307842758,
"learning_rate": 8.240964159763121e-07,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2336377203464508,
"step": 4015,
"valid_targets_mean": 5360.7,
"valid_targets_min": 647
},
{
"epoch": 6.432,
"grad_norm": 0.44447996013306695,
"learning_rate": 8.015790275957003e-07,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2225901037454605,
"step": 4020,
"valid_targets_mean": 5149.2,
"valid_targets_min": 2655
},
{
"epoch": 6.44,
"grad_norm": 0.4238855863067296,
"learning_rate": 7.793672536469077e-07,
"loss": 0.244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21927297115325928,
"step": 4025,
"valid_targets_mean": 5357.9,
"valid_targets_min": 2314
},
{
"epoch": 6.448,
"grad_norm": 0.4830003944984125,
"learning_rate": 7.574614477131081e-07,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2570672333240509,
"step": 4030,
"valid_targets_mean": 4749.3,
"valid_targets_min": 965
},
{
"epoch": 6.456,
"grad_norm": 0.40887871261527975,
"learning_rate": 7.358619585068583e-07,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2433190941810608,
"step": 4035,
"valid_targets_mean": 6246.4,
"valid_targets_min": 3007
},
{
"epoch": 6.464,
"grad_norm": 0.3859653370068934,
"learning_rate": 7.145691298645419e-07,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24633197486400604,
"step": 4040,
"valid_targets_mean": 7010.8,
"valid_targets_min": 3496
},
{
"epoch": 6.4719999999999995,
"grad_norm": 0.38681864849268677,
"learning_rate": 6.935833007408965e-07,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2680492699146271,
"step": 4045,
"valid_targets_mean": 6608.4,
"valid_targets_min": 613
},
{
"epoch": 6.48,
"grad_norm": 0.4460709435308017,
"learning_rate": 6.729048052036136e-07,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2533029317855835,
"step": 4050,
"valid_targets_mean": 5791.8,
"valid_targets_min": 1604
},
{
"epoch": 6.4879999999999995,
"grad_norm": 0.3943743836605657,
"learning_rate": 6.52533972428031e-07,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23628069460391998,
"step": 4055,
"valid_targets_mean": 6551.3,
"valid_targets_min": 2696
},
{
"epoch": 6.496,
"grad_norm": 0.4312618998760607,
"learning_rate": 6.324711266918826e-07,
"loss": 0.2396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25112444162368774,
"step": 4060,
"valid_targets_mean": 5862.1,
"valid_targets_min": 2993
},
{
"epoch": 6.504,
"grad_norm": 0.483174829368675,
"learning_rate": 6.127165873701457e-07,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23675619065761566,
"step": 4065,
"valid_targets_mean": 4392.4,
"valid_targets_min": 901
},
{
"epoch": 6.5120000000000005,
"grad_norm": 0.4197944086659229,
"learning_rate": 5.932706689299461e-07,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2547464668750763,
"step": 4070,
"valid_targets_mean": 5488.9,
"valid_targets_min": 2215
},
{
"epoch": 6.52,
"grad_norm": 0.33766862446417356,
"learning_rate": 5.741336809255615e-07,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25667327642440796,
"step": 4075,
"valid_targets_mean": 7697.0,
"valid_targets_min": 2813
},
{
"epoch": 6.5280000000000005,
"grad_norm": 0.4533360710834701,
"learning_rate": 5.553059279934902e-07,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22701610624790192,
"step": 4080,
"valid_targets_mean": 5237.2,
"valid_targets_min": 1011
},
{
"epoch": 6.536,
"grad_norm": 0.3726240899705432,
"learning_rate": 5.36787709847597e-07,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2350490689277649,
"step": 4085,
"valid_targets_mean": 6899.0,
"valid_targets_min": 3302
},
{
"epoch": 6.5440000000000005,
"grad_norm": 0.421250464481422,
"learning_rate": 5.185793212743529e-07,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2310941517353058,
"step": 4090,
"valid_targets_mean": 5545.6,
"valid_targets_min": 2301
},
{
"epoch": 6.552,
"grad_norm": 0.45769843975283325,
"learning_rate": 5.006810521281335e-07,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2067297399044037,
"step": 4095,
"valid_targets_mean": 4581.6,
"valid_targets_min": 907
},
{
"epoch": 6.5600000000000005,
"grad_norm": 0.4005818383542897,
"learning_rate": 4.830931873266065e-07,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23793132603168488,
"step": 4100,
"valid_targets_mean": 5918.6,
"valid_targets_min": 611
},
{
"epoch": 6.568,
"grad_norm": 0.39937305590430555,
"learning_rate": 4.658160068462025e-07,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2463841736316681,
"step": 4105,
"valid_targets_mean": 6267.2,
"valid_targets_min": 3317
},
{
"epoch": 6.576,
"grad_norm": 0.32626143813018726,
"learning_rate": 4.488497857176466e-07,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2482718527317047,
"step": 4110,
"valid_targets_mean": 7305.4,
"valid_targets_min": 542
},
{
"epoch": 6.584,
"grad_norm": 0.4539225656394375,
"learning_rate": 4.321947940215898e-07,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23661956191062927,
"step": 4115,
"valid_targets_mean": 5279.0,
"valid_targets_min": 2007
},
{
"epoch": 6.592,
"grad_norm": 0.4344850114515945,
"learning_rate": 4.1585129688430425e-07,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24658052623271942,
"step": 4120,
"valid_targets_mean": 5324.8,
"valid_targets_min": 549
},
{
"epoch": 6.6,
"grad_norm": 0.39310146860493744,
"learning_rate": 3.998195544734706e-07,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24207232892513275,
"step": 4125,
"valid_targets_mean": 6842.8,
"valid_targets_min": 2210
},
{
"epoch": 6.608,
"grad_norm": 0.4149625856439961,
"learning_rate": 3.840998219940284e-07,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26455581188201904,
"step": 4130,
"valid_targets_mean": 5933.3,
"valid_targets_min": 2936
},
{
"epoch": 6.616,
"grad_norm": 0.4058154946023268,
"learning_rate": 3.6869234968411214e-07,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25165531039237976,
"step": 4135,
"valid_targets_mean": 5976.5,
"valid_targets_min": 766
},
{
"epoch": 6.624,
"grad_norm": 0.4120431574460261,
"learning_rate": 3.5359738281107504e-07,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24470007419586182,
"step": 4140,
"valid_targets_mean": 6167.4,
"valid_targets_min": 2083
},
{
"epoch": 6.632,
"grad_norm": 0.44621207055238954,
"learning_rate": 3.38815161667585e-07,
"loss": 0.2496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24108701944351196,
"step": 4145,
"valid_targets_mean": 5187.9,
"valid_targets_min": 2760
},
{
"epoch": 6.64,
"grad_norm": 0.45740673758834627,
"learning_rate": 3.24345921567788e-07,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25003916025161743,
"step": 4150,
"valid_targets_mean": 5214.8,
"valid_targets_min": 2432
},
{
"epoch": 6.648,
"grad_norm": 0.38170623989649993,
"learning_rate": 3.101898928435754e-07,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26009601354599,
"step": 4155,
"valid_targets_mean": 6232.9,
"valid_targets_min": 2900
},
{
"epoch": 6.656,
"grad_norm": 0.3949667344123087,
"learning_rate": 2.9634730084091343e-07,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2611731290817261,
"step": 4160,
"valid_targets_mean": 6492.0,
"valid_targets_min": 2597
},
{
"epoch": 6.664,
"grad_norm": 0.481054045629589,
"learning_rate": 2.8281836591624865e-07,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22188538312911987,
"step": 4165,
"valid_targets_mean": 4702.8,
"valid_targets_min": 1883
},
{
"epoch": 6.672,
"grad_norm": 0.45164701161138154,
"learning_rate": 2.6960330343301033e-07,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23218591511249542,
"step": 4170,
"valid_targets_mean": 4975.9,
"valid_targets_min": 2262
},
{
"epoch": 6.68,
"grad_norm": 0.4796809330908409,
"learning_rate": 2.5670232375817784e-07,
"loss": 0.2479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22703537344932556,
"step": 4175,
"valid_targets_mean": 4798.4,
"valid_targets_min": 859
},
{
"epoch": 6.688,
"grad_norm": 0.44726947654327165,
"learning_rate": 2.441156322589322e-07,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21367965638637543,
"step": 4180,
"valid_targets_mean": 5252.1,
"valid_targets_min": 2079
},
{
"epoch": 6.696,
"grad_norm": 0.4199003621464118,
"learning_rate": 2.318434292993832e-07,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2607828378677368,
"step": 4185,
"valid_targets_mean": 6629.9,
"valid_targets_min": 3995
},
{
"epoch": 6.704,
"grad_norm": 0.4016367445657586,
"learning_rate": 2.1988591023738514e-07,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26771795749664307,
"step": 4190,
"valid_targets_mean": 6307.6,
"valid_targets_min": 2672
},
{
"epoch": 6.712,
"grad_norm": 0.399715800869208,
"learning_rate": 2.0824326542142835e-07,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2620810270309448,
"step": 4195,
"valid_targets_mean": 6914.5,
"valid_targets_min": 2479
},
{
"epoch": 6.72,
"grad_norm": 0.3910519268922181,
"learning_rate": 1.9691568018759931e-07,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23408928513526917,
"step": 4200,
"valid_targets_mean": 6041.6,
"valid_targets_min": 2297
},
{
"epoch": 6.728,
"grad_norm": 0.40997014213714333,
"learning_rate": 1.8590333485664525e-07,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2437349408864975,
"step": 4205,
"valid_targets_mean": 5969.2,
"valid_targets_min": 2861
},
{
"epoch": 6.736,
"grad_norm": 0.4079184645546954,
"learning_rate": 1.752064047310853e-07,
"loss": 0.2464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2418249547481537,
"step": 4210,
"valid_targets_mean": 5699.6,
"valid_targets_min": 3429
},
{
"epoch": 6.744,
"grad_norm": 0.437700129698411,
"learning_rate": 1.6482506009243949e-07,
"loss": 0.2466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29487597942352295,
"step": 4215,
"valid_targets_mean": 6602.3,
"valid_targets_min": 2588
},
{
"epoch": 6.752,
"grad_norm": 0.4142521640099534,
"learning_rate": 1.5475946619850192e-07,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24046289920806885,
"step": 4220,
"valid_targets_mean": 6069.1,
"valid_targets_min": 711
},
{
"epoch": 6.76,
"grad_norm": 0.41546394357679706,
"learning_rate": 1.4500978328071845e-07,
"loss": 0.2341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25072425603866577,
"step": 4225,
"valid_targets_mean": 5360.8,
"valid_targets_min": 428
},
{
"epoch": 6.768,
"grad_norm": 0.40151629403045647,
"learning_rate": 1.3557616654163775e-07,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2626868784427643,
"step": 4230,
"valid_targets_mean": 6657.1,
"valid_targets_min": 3302
},
{
"epoch": 6.776,
"grad_norm": 0.42833620944626843,
"learning_rate": 1.264587661524308e-07,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24112708866596222,
"step": 4235,
"valid_targets_mean": 6090.4,
"valid_targets_min": 950
},
{
"epoch": 6.784,
"grad_norm": 0.4154553942811618,
"learning_rate": 1.1765772725051084e-07,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23809021711349487,
"step": 4240,
"valid_targets_mean": 5470.9,
"valid_targets_min": 1628
},
{
"epoch": 6.792,
"grad_norm": 0.4195908754448132,
"learning_rate": 1.0917318993721726e-07,
"loss": 0.2496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2500789165496826,
"step": 4245,
"valid_targets_mean": 5899.9,
"valid_targets_min": 2438
},
{
"epoch": 6.8,
"grad_norm": 0.45570500783237344,
"learning_rate": 1.0100528927558861e-07,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20834442973136902,
"step": 4250,
"valid_targets_mean": 4979.1,
"valid_targets_min": 2591
},
{
"epoch": 6.808,
"grad_norm": 0.4170242154763821,
"learning_rate": 9.31541552882087e-08,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23040908575057983,
"step": 4255,
"valid_targets_mean": 5964.5,
"valid_targets_min": 2124
},
{
"epoch": 6.816,
"grad_norm": 0.4142871848307513,
"learning_rate": 8.561991295514161e-08,
"loss": 0.2444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2491617053747177,
"step": 4260,
"valid_targets_mean": 5598.0,
"valid_targets_min": 1553
},
{
"epoch": 6.824,
"grad_norm": 0.4151855097481202,
"learning_rate": 7.840268221193548e-08,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24346888065338135,
"step": 4265,
"valid_targets_mean": 6049.5,
"valid_targets_min": 2898
},
{
"epoch": 6.832,
"grad_norm": 0.4555291535355044,
"learning_rate": 7.150257794772186e-08,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24714088439941406,
"step": 4270,
"valid_targets_mean": 6723.9,
"valid_targets_min": 926
},
{
"epoch": 6.84,
"grad_norm": 0.4369171425961876,
"learning_rate": 6.491971000337938e-08,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22927583754062653,
"step": 4275,
"valid_targets_mean": 5355.7,
"valid_targets_min": 1490
},
{
"epoch": 6.848,
"grad_norm": 0.3603313297065621,
"learning_rate": 5.8654183169788435e-08,
"loss": 0.2543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2546162009239197,
"step": 4280,
"valid_targets_mean": 7805.7,
"valid_targets_min": 2702
},
{
"epoch": 6.856,
"grad_norm": 0.3776558735589143,
"learning_rate": 5.270609718616593e-08,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2700864374637604,
"step": 4285,
"valid_targets_mean": 7140.9,
"valid_targets_min": 2497
},
{
"epoch": 6.864,
"grad_norm": 0.3910196634027121,
"learning_rate": 4.70755467384687e-08,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2360091507434845,
"step": 4290,
"valid_targets_mean": 6045.0,
"valid_targets_min": 2924
},
{
"epoch": 6.872,
"grad_norm": 0.42067440511825865,
"learning_rate": 4.176262145789478e-08,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23304817080497742,
"step": 4295,
"valid_targets_mean": 6235.3,
"valid_targets_min": 2477
},
{
"epoch": 6.88,
"grad_norm": 0.44819785709400006,
"learning_rate": 3.676740591945782e-08,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23022767901420593,
"step": 4300,
"valid_targets_mean": 5170.4,
"valid_targets_min": 845
},
{
"epoch": 6.888,
"grad_norm": 0.38159591470198784,
"learning_rate": 3.208997964062821e-08,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.266330748796463,
"step": 4305,
"valid_targets_mean": 6728.8,
"valid_targets_min": 809
},
{
"epoch": 6.896,
"grad_norm": 0.47438857326603057,
"learning_rate": 2.773041708008295e-08,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21114903688430786,
"step": 4310,
"valid_targets_mean": 4498.0,
"valid_targets_min": 714
},
{
"epoch": 6.904,
"grad_norm": 0.4169788152049192,
"learning_rate": 2.3688787636511057e-08,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2451530396938324,
"step": 4315,
"valid_targets_mean": 5779.1,
"valid_targets_min": 2389
},
{
"epoch": 6.912,
"grad_norm": 0.5314249782039797,
"learning_rate": 1.9965155647507782e-08,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24146723747253418,
"step": 4320,
"valid_targets_mean": 4286.8,
"valid_targets_min": 594
},
{
"epoch": 6.92,
"grad_norm": 0.42573633152148477,
"learning_rate": 1.655958038855765e-08,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257783442735672,
"step": 4325,
"valid_targets_mean": 5627.4,
"valid_targets_min": 881
},
{
"epoch": 6.928,
"grad_norm": 0.4097519577004155,
"learning_rate": 1.3472116072084096e-08,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23979437351226807,
"step": 4330,
"valid_targets_mean": 5950.1,
"valid_targets_min": 3580
},
{
"epoch": 6.936,
"grad_norm": 0.4454465260722158,
"learning_rate": 1.0702811846590167e-08,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2746885418891907,
"step": 4335,
"valid_targets_mean": 5342.9,
"valid_targets_min": 954
},
{
"epoch": 6.944,
"grad_norm": 0.41412006546592484,
"learning_rate": 8.251711795876916e-09,
"loss": 0.2337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24524347484111786,
"step": 4340,
"valid_targets_mean": 5723.5,
"valid_targets_min": 1678
},
{
"epoch": 6.952,
"grad_norm": 0.4452590210279377,
"learning_rate": 6.1188549383373044e-09,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22402501106262207,
"step": 4345,
"valid_targets_mean": 5053.6,
"valid_targets_min": 1317
},
{
"epoch": 6.96,
"grad_norm": 0.4249708336351826,
"learning_rate": 4.304275226338916e-09,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23752881586551666,
"step": 4350,
"valid_targets_mean": 5775.6,
"valid_targets_min": 729
},
{
"epoch": 6.968,
"grad_norm": 0.4351604501867694,
"learning_rate": 2.8080015456799503e-09,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2576856017112732,
"step": 4355,
"valid_targets_mean": 5823.6,
"valid_targets_min": 720
},
{
"epoch": 6.976,
"grad_norm": 0.43551585909366247,
"learning_rate": 1.6300577151340257e-09,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23403063416481018,
"step": 4360,
"valid_targets_mean": 5693.9,
"valid_targets_min": 3118
},
{
"epoch": 6.984,
"grad_norm": 0.44352689496306524,
"learning_rate": 7.70462486070489e-10,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642480134963989,
"step": 4365,
"valid_targets_mean": 6007.5,
"valid_targets_min": 2710
},
{
"epoch": 6.992,
"grad_norm": 0.41338621237648826,
"learning_rate": 2.2922954214799065e-10,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2713726758956909,
"step": 4370,
"valid_targets_mean": 6049.0,
"valid_targets_min": 2589
},
{
"epoch": 7.0,
"grad_norm": 0.4110206394678341,
"learning_rate": 6.367499107984288e-12,
"loss": 0.2365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23771843314170837,
"step": 4375,
"valid_targets_mean": 6046.8,
"valid_targets_min": 2950
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23771843314170837,
"step": 4375,
"total_flos": 1967928670814208.0,
"train_loss": 0.28350407949175155,
"train_runtime": 36852.1456,
"train_samples_per_second": 1.899,
"train_steps_per_second": 0.119,
"valid_targets_mean": 6046.8,
"valid_targets_min": 2950
}
],
"logging_steps": 5,
"max_steps": 4375,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1967928670814208.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}