Files
a1-nemotron_bash/trainer_state.json
ModelHub XC 179cbd0034 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/a1-nemotron_bash
Source: Original Platform
2026-05-04 06:11:27 +08:00

9541 lines
265 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4319,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008103727714748784,
"grad_norm": 15.052451796629647,
"learning_rate": 3.7037037037037036e-07,
"loss": 0.744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7075120210647583,
"step": 5,
"valid_targets_mean": 4307.1,
"valid_targets_min": 2137
},
{
"epoch": 0.01620745542949757,
"grad_norm": 14.16077406559237,
"learning_rate": 8.333333333333333e-07,
"loss": 0.6971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7030583620071411,
"step": 10,
"valid_targets_mean": 6069.7,
"valid_targets_min": 2317
},
{
"epoch": 0.024311183144246355,
"grad_norm": 12.310953306211442,
"learning_rate": 1.2962962962962962e-06,
"loss": 0.7099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6455563306808472,
"step": 15,
"valid_targets_mean": 5927.9,
"valid_targets_min": 2198
},
{
"epoch": 0.03241491085899514,
"grad_norm": 11.75979384479062,
"learning_rate": 1.7592592592592594e-06,
"loss": 0.6609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6437151432037354,
"step": 20,
"valid_targets_mean": 5138.6,
"valid_targets_min": 1450
},
{
"epoch": 0.04051863857374392,
"grad_norm": 7.098490762665116,
"learning_rate": 2.222222222222222e-06,
"loss": 0.5954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5416496396064758,
"step": 25,
"valid_targets_mean": 4411.9,
"valid_targets_min": 1399
},
{
"epoch": 0.04862236628849271,
"grad_norm": 4.7050280865823675,
"learning_rate": 2.6851851851851856e-06,
"loss": 0.5509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5249617099761963,
"step": 30,
"valid_targets_mean": 3748.4,
"valid_targets_min": 1344
},
{
"epoch": 0.05672609400324149,
"grad_norm": 2.5302822583427482,
"learning_rate": 3.1481481481481483e-06,
"loss": 0.5361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5037345886230469,
"step": 35,
"valid_targets_mean": 4683.2,
"valid_targets_min": 1359
},
{
"epoch": 0.06482982171799027,
"grad_norm": 1.7953600503801777,
"learning_rate": 3.6111111111111115e-06,
"loss": 0.4987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4654555916786194,
"step": 40,
"valid_targets_mean": 4019.7,
"valid_targets_min": 1745
},
{
"epoch": 0.07293354943273905,
"grad_norm": 1.3040568058787088,
"learning_rate": 4.074074074074074e-06,
"loss": 0.4715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4576088786125183,
"step": 45,
"valid_targets_mean": 4056.4,
"valid_targets_min": 1336
},
{
"epoch": 0.08103727714748785,
"grad_norm": 1.1186358672828327,
"learning_rate": 4.537037037037038e-06,
"loss": 0.4492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4448954463005066,
"step": 50,
"valid_targets_mean": 3493.5,
"valid_targets_min": 944
},
{
"epoch": 0.08914100486223663,
"grad_norm": 0.8583349811923283,
"learning_rate": 5e-06,
"loss": 0.432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4754987061023712,
"step": 55,
"valid_targets_mean": 4823.1,
"valid_targets_min": 2229
},
{
"epoch": 0.09724473257698542,
"grad_norm": 0.7390069286691012,
"learning_rate": 5.462962962962963e-06,
"loss": 0.4456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43904808163642883,
"step": 60,
"valid_targets_mean": 4810.8,
"valid_targets_min": 1311
},
{
"epoch": 0.1053484602917342,
"grad_norm": 0.7415924654887941,
"learning_rate": 5.925925925925926e-06,
"loss": 0.4378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4822186231613159,
"step": 65,
"valid_targets_mean": 4482.6,
"valid_targets_min": 1182
},
{
"epoch": 0.11345218800648298,
"grad_norm": 0.6929052623611306,
"learning_rate": 6.3888888888888885e-06,
"loss": 0.4383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49454551935195923,
"step": 70,
"valid_targets_mean": 6779.2,
"valid_targets_min": 2081
},
{
"epoch": 0.12155591572123177,
"grad_norm": 0.6540631430503951,
"learning_rate": 6.851851851851853e-06,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35995030403137207,
"step": 75,
"valid_targets_mean": 4102.6,
"valid_targets_min": 1430
},
{
"epoch": 0.12965964343598055,
"grad_norm": 0.6110409858399266,
"learning_rate": 7.314814814814816e-06,
"loss": 0.4059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44885435700416565,
"step": 80,
"valid_targets_mean": 5470.8,
"valid_targets_min": 1387
},
{
"epoch": 0.13776337115072934,
"grad_norm": 0.6225608077350795,
"learning_rate": 7.77777777777778e-06,
"loss": 0.4113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4068431258201599,
"step": 85,
"valid_targets_mean": 5061.4,
"valid_targets_min": 1385
},
{
"epoch": 0.1458670988654781,
"grad_norm": 0.5508564720574586,
"learning_rate": 8.240740740740741e-06,
"loss": 0.3725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35934633016586304,
"step": 90,
"valid_targets_mean": 4809.6,
"valid_targets_min": 676
},
{
"epoch": 0.1539708265802269,
"grad_norm": 0.6585566821793581,
"learning_rate": 8.703703703703705e-06,
"loss": 0.3701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37526312470436096,
"step": 95,
"valid_targets_mean": 4011.1,
"valid_targets_min": 1477
},
{
"epoch": 0.1620745542949757,
"grad_norm": 0.567030762477571,
"learning_rate": 9.166666666666666e-06,
"loss": 0.3514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.367622971534729,
"step": 100,
"valid_targets_mean": 4913.1,
"valid_targets_min": 1476
},
{
"epoch": 0.17017828200972449,
"grad_norm": 0.6144227532600338,
"learning_rate": 9.62962962962963e-06,
"loss": 0.3632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3684994876384735,
"step": 105,
"valid_targets_mean": 3957.9,
"valid_targets_min": 1271
},
{
"epoch": 0.17828200972447325,
"grad_norm": 0.5569033858777038,
"learning_rate": 1.0092592592592594e-05,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36880379915237427,
"step": 110,
"valid_targets_mean": 5144.2,
"valid_targets_min": 1418
},
{
"epoch": 0.18638573743922204,
"grad_norm": 0.636909406673007,
"learning_rate": 1.0555555555555557e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3586111068725586,
"step": 115,
"valid_targets_mean": 3771.0,
"valid_targets_min": 1440
},
{
"epoch": 0.19448946515397084,
"grad_norm": 0.5782624385183504,
"learning_rate": 1.1018518518518519e-05,
"loss": 0.3206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2734828293323517,
"step": 120,
"valid_targets_mean": 4552.7,
"valid_targets_min": 2314
},
{
"epoch": 0.2025931928687196,
"grad_norm": 0.8013266382776258,
"learning_rate": 1.1481481481481482e-05,
"loss": 0.3345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34413567185401917,
"step": 125,
"valid_targets_mean": 3705.8,
"valid_targets_min": 1327
},
{
"epoch": 0.2106969205834684,
"grad_norm": 0.6573462845572078,
"learning_rate": 1.1944444444444444e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3564257323741913,
"step": 130,
"valid_targets_mean": 5756.6,
"valid_targets_min": 1527
},
{
"epoch": 0.2188006482982172,
"grad_norm": 0.6145775154410387,
"learning_rate": 1.2407407407407408e-05,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2915225625038147,
"step": 135,
"valid_targets_mean": 4130.4,
"valid_targets_min": 2179
},
{
"epoch": 0.22690437601296595,
"grad_norm": 0.6299790820533513,
"learning_rate": 1.2870370370370371e-05,
"loss": 0.3186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35333144664764404,
"step": 140,
"valid_targets_mean": 4053.9,
"valid_targets_min": 1936
},
{
"epoch": 0.23500810372771475,
"grad_norm": 0.5798870208280786,
"learning_rate": 1.3333333333333333e-05,
"loss": 0.3072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2676125466823578,
"step": 145,
"valid_targets_mean": 4628.5,
"valid_targets_min": 640
},
{
"epoch": 0.24311183144246354,
"grad_norm": 0.7204824013564382,
"learning_rate": 1.3796296296296297e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32080602645874023,
"step": 150,
"valid_targets_mean": 4789.8,
"valid_targets_min": 2557
},
{
"epoch": 0.25121555915721233,
"grad_norm": 0.5701902969082061,
"learning_rate": 1.4259259259259259e-05,
"loss": 0.3141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2823035717010498,
"step": 155,
"valid_targets_mean": 4539.7,
"valid_targets_min": 1340
},
{
"epoch": 0.2593192868719611,
"grad_norm": 0.672412353901392,
"learning_rate": 1.4722222222222224e-05,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31722885370254517,
"step": 160,
"valid_targets_mean": 3801.2,
"valid_targets_min": 1484
},
{
"epoch": 0.26742301458670986,
"grad_norm": 0.6055091876647029,
"learning_rate": 1.5185185185185187e-05,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.289315789937973,
"step": 165,
"valid_targets_mean": 4378.0,
"valid_targets_min": 1423
},
{
"epoch": 0.2755267423014587,
"grad_norm": 0.5986947151887498,
"learning_rate": 1.564814814814815e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2713383138179779,
"step": 170,
"valid_targets_mean": 4662.1,
"valid_targets_min": 774
},
{
"epoch": 0.28363047001620745,
"grad_norm": 0.589272512044107,
"learning_rate": 1.6111111111111115e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23535937070846558,
"step": 175,
"valid_targets_mean": 4591.1,
"valid_targets_min": 1438
},
{
"epoch": 0.2917341977309562,
"grad_norm": 0.6642075943919709,
"learning_rate": 1.6574074074074075e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3774803876876831,
"step": 180,
"valid_targets_mean": 4475.9,
"valid_targets_min": 1154
},
{
"epoch": 0.29983792544570503,
"grad_norm": 0.5268979191410055,
"learning_rate": 1.7037037037037038e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2813992500305176,
"step": 185,
"valid_targets_mean": 5149.6,
"valid_targets_min": 1851
},
{
"epoch": 0.3079416531604538,
"grad_norm": 0.570391651488006,
"learning_rate": 1.7500000000000002e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2881418764591217,
"step": 190,
"valid_targets_mean": 5290.5,
"valid_targets_min": 1412
},
{
"epoch": 0.3160453808752026,
"grad_norm": 0.6322213174821355,
"learning_rate": 1.7962962962962965e-05,
"loss": 0.2729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3086417317390442,
"step": 195,
"valid_targets_mean": 4418.4,
"valid_targets_min": 1260
},
{
"epoch": 0.3241491085899514,
"grad_norm": 0.6750293354196638,
"learning_rate": 1.8425925925925926e-05,
"loss": 0.2881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3000980615615845,
"step": 200,
"valid_targets_mean": 3632.8,
"valid_targets_min": 1405
},
{
"epoch": 0.33225283630470015,
"grad_norm": 0.5598256550566737,
"learning_rate": 1.888888888888889e-05,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3009907007217407,
"step": 205,
"valid_targets_mean": 4531.7,
"valid_targets_min": 372
},
{
"epoch": 0.34035656401944897,
"grad_norm": 0.6410032816153864,
"learning_rate": 1.9351851851851853e-05,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23578113317489624,
"step": 210,
"valid_targets_mean": 3848.1,
"valid_targets_min": 1328
},
{
"epoch": 0.34846029173419774,
"grad_norm": 0.670577961345641,
"learning_rate": 1.9814814814814816e-05,
"loss": 0.2385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26014572381973267,
"step": 215,
"valid_targets_mean": 3549.2,
"valid_targets_min": 1323
},
{
"epoch": 0.3565640194489465,
"grad_norm": 0.5542778499650366,
"learning_rate": 2.027777777777778e-05,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911411225795746,
"step": 220,
"valid_targets_mean": 6411.4,
"valid_targets_min": 1036
},
{
"epoch": 0.3646677471636953,
"grad_norm": 0.5687749934223739,
"learning_rate": 2.074074074074074e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2129267156124115,
"step": 225,
"valid_targets_mean": 4360.8,
"valid_targets_min": 1473
},
{
"epoch": 0.3727714748784441,
"grad_norm": 0.545745675422607,
"learning_rate": 2.1203703703703703e-05,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25986871123313904,
"step": 230,
"valid_targets_mean": 4436.2,
"valid_targets_min": 1362
},
{
"epoch": 0.38087520259319285,
"grad_norm": 0.5149796037209613,
"learning_rate": 2.1666666666666667e-05,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23290029168128967,
"step": 235,
"valid_targets_mean": 5435.3,
"valid_targets_min": 1451
},
{
"epoch": 0.3889789303079417,
"grad_norm": 0.6133182407650534,
"learning_rate": 2.212962962962963e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26056742668151855,
"step": 240,
"valid_targets_mean": 4159.4,
"valid_targets_min": 1314
},
{
"epoch": 0.39708265802269044,
"grad_norm": 0.5649078331736651,
"learning_rate": 2.2592592592592594e-05,
"loss": 0.262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2821381092071533,
"step": 245,
"valid_targets_mean": 4649.4,
"valid_targets_min": 1490
},
{
"epoch": 0.4051863857374392,
"grad_norm": 0.6118904964971021,
"learning_rate": 2.3055555555555554e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3021799921989441,
"step": 250,
"valid_targets_mean": 5177.1,
"valid_targets_min": 1482
},
{
"epoch": 0.413290113452188,
"grad_norm": 0.6071615375178763,
"learning_rate": 2.3518518518518518e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19076423346996307,
"step": 255,
"valid_targets_mean": 4186.5,
"valid_targets_min": 1178
},
{
"epoch": 0.4213938411669368,
"grad_norm": 0.5991586523880158,
"learning_rate": 2.3981481481481485e-05,
"loss": 0.2559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2608402371406555,
"step": 260,
"valid_targets_mean": 3828.4,
"valid_targets_min": 914
},
{
"epoch": 0.42949756888168555,
"grad_norm": 0.6337407192018856,
"learning_rate": 2.444444444444445e-05,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24443909525871277,
"step": 265,
"valid_targets_mean": 4669.5,
"valid_targets_min": 1387
},
{
"epoch": 0.4376012965964344,
"grad_norm": 0.6370177249174864,
"learning_rate": 2.4907407407407412e-05,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23749151825904846,
"step": 270,
"valid_targets_mean": 3662.0,
"valid_targets_min": 1268
},
{
"epoch": 0.44570502431118314,
"grad_norm": 0.6685559577348903,
"learning_rate": 2.5370370370370375e-05,
"loss": 0.2526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22629933059215546,
"step": 275,
"valid_targets_mean": 3966.9,
"valid_targets_min": 1361
},
{
"epoch": 0.4538087520259319,
"grad_norm": 0.5774981883358449,
"learning_rate": 2.5833333333333336e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2319318950176239,
"step": 280,
"valid_targets_mean": 4366.3,
"valid_targets_min": 1123
},
{
"epoch": 0.4619124797406807,
"grad_norm": 0.639777977381849,
"learning_rate": 2.62962962962963e-05,
"loss": 0.2821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22607596218585968,
"step": 285,
"valid_targets_mean": 4010.4,
"valid_targets_min": 1034
},
{
"epoch": 0.4700162074554295,
"grad_norm": 0.5632527042212236,
"learning_rate": 2.6759259259259263e-05,
"loss": 0.2222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21673567593097687,
"step": 290,
"valid_targets_mean": 4221.4,
"valid_targets_min": 1426
},
{
"epoch": 0.47811993517017826,
"grad_norm": 0.641243133328366,
"learning_rate": 2.7222222222222226e-05,
"loss": 0.2342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21339434385299683,
"step": 295,
"valid_targets_mean": 3281.4,
"valid_targets_min": 862
},
{
"epoch": 0.4862236628849271,
"grad_norm": 0.5785904863633673,
"learning_rate": 2.768518518518519e-05,
"loss": 0.2401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2441210299730301,
"step": 300,
"valid_targets_mean": 5462.9,
"valid_targets_min": 1413
},
{
"epoch": 0.49432739059967584,
"grad_norm": 0.6186086113261662,
"learning_rate": 2.814814814814815e-05,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24510961771011353,
"step": 305,
"valid_targets_mean": 4120.8,
"valid_targets_min": 1337
},
{
"epoch": 0.5024311183144247,
"grad_norm": 0.7369432792730909,
"learning_rate": 2.8611111111111113e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22853118181228638,
"step": 310,
"valid_targets_mean": 3062.8,
"valid_targets_min": 582
},
{
"epoch": 0.5105348460291734,
"grad_norm": 0.5012959603011699,
"learning_rate": 2.9074074074074077e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.265197217464447,
"step": 315,
"valid_targets_mean": 4856.2,
"valid_targets_min": 1409
},
{
"epoch": 0.5186385737439222,
"grad_norm": 0.5881603988884309,
"learning_rate": 2.953703703703704e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24882851541042328,
"step": 320,
"valid_targets_mean": 4374.3,
"valid_targets_min": 1504
},
{
"epoch": 0.526742301458671,
"grad_norm": 0.5843683180477552,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3021346926689148,
"step": 325,
"valid_targets_mean": 4368.1,
"valid_targets_min": 849
},
{
"epoch": 0.5348460291734197,
"grad_norm": 0.5638995855114154,
"learning_rate": 3.0462962962962964e-05,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2310064136981964,
"step": 330,
"valid_targets_mean": 4034.5,
"valid_targets_min": 1392
},
{
"epoch": 0.5429497568881686,
"grad_norm": 0.6241796157785493,
"learning_rate": 3.092592592592593e-05,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2775031626224518,
"step": 335,
"valid_targets_mean": 4538.9,
"valid_targets_min": 1472
},
{
"epoch": 0.5510534846029174,
"grad_norm": 0.5986159843009783,
"learning_rate": 3.138888888888889e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2154683768749237,
"step": 340,
"valid_targets_mean": 4171.1,
"valid_targets_min": 1448
},
{
"epoch": 0.5591572123176661,
"grad_norm": 0.5678213186550801,
"learning_rate": 3.185185185185185e-05,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21003559231758118,
"step": 345,
"valid_targets_mean": 4115.6,
"valid_targets_min": 1494
},
{
"epoch": 0.5672609400324149,
"grad_norm": 0.5000435710526403,
"learning_rate": 3.231481481481482e-05,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21373742818832397,
"step": 350,
"valid_targets_mean": 5205.3,
"valid_targets_min": 1382
},
{
"epoch": 0.5753646677471637,
"grad_norm": 0.6182955908884262,
"learning_rate": 3.277777777777778e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23803135752677917,
"step": 355,
"valid_targets_mean": 3645.1,
"valid_targets_min": 1045
},
{
"epoch": 0.5834683954619124,
"grad_norm": 0.618571479862893,
"learning_rate": 3.3240740740740746e-05,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19696547091007233,
"step": 360,
"valid_targets_mean": 4458.5,
"valid_targets_min": 1330
},
{
"epoch": 0.5915721231766613,
"grad_norm": 0.5044774531396774,
"learning_rate": 3.3703703703703706e-05,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2560524344444275,
"step": 365,
"valid_targets_mean": 5364.7,
"valid_targets_min": 1432
},
{
"epoch": 0.5996758508914101,
"grad_norm": 0.4850915687468068,
"learning_rate": 3.4166666666666666e-05,
"loss": 0.2305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22693286836147308,
"step": 370,
"valid_targets_mean": 5804.1,
"valid_targets_min": 1286
},
{
"epoch": 0.6077795786061588,
"grad_norm": 0.7767357031334243,
"learning_rate": 3.462962962962963e-05,
"loss": 0.2409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23934313654899597,
"step": 375,
"valid_targets_mean": 4335.7,
"valid_targets_min": 688
},
{
"epoch": 0.6158833063209076,
"grad_norm": 0.5297011414951764,
"learning_rate": 3.509259259259259e-05,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2228357195854187,
"step": 380,
"valid_targets_mean": 4548.9,
"valid_targets_min": 616
},
{
"epoch": 0.6239870340356564,
"grad_norm": 0.5580892808180266,
"learning_rate": 3.555555555555555e-05,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24209387600421906,
"step": 385,
"valid_targets_mean": 4770.1,
"valid_targets_min": 1486
},
{
"epoch": 0.6320907617504052,
"grad_norm": 0.5064875325748078,
"learning_rate": 3.601851851851852e-05,
"loss": 0.2317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24600476026535034,
"step": 390,
"valid_targets_mean": 4807.3,
"valid_targets_min": 1405
},
{
"epoch": 0.640194489465154,
"grad_norm": 0.8096595526534478,
"learning_rate": 3.648148148148149e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2103320062160492,
"step": 395,
"valid_targets_mean": 5441.9,
"valid_targets_min": 1376
},
{
"epoch": 0.6482982171799028,
"grad_norm": 0.527656122669523,
"learning_rate": 3.694444444444445e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21797297894954681,
"step": 400,
"valid_targets_mean": 4970.8,
"valid_targets_min": 1286
},
{
"epoch": 0.6564019448946515,
"grad_norm": 0.5353735139926096,
"learning_rate": 3.7407407407407414e-05,
"loss": 0.2274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2168428897857666,
"step": 405,
"valid_targets_mean": 4440.8,
"valid_targets_min": 1348
},
{
"epoch": 0.6645056726094003,
"grad_norm": 0.5014487865079957,
"learning_rate": 3.7870370370370374e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2826576828956604,
"step": 410,
"valid_targets_mean": 4816.1,
"valid_targets_min": 1489
},
{
"epoch": 0.6726094003241491,
"grad_norm": 0.5310106006676556,
"learning_rate": 3.833333333333334e-05,
"loss": 0.2236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22325406968593597,
"step": 415,
"valid_targets_mean": 4324.9,
"valid_targets_min": 1259
},
{
"epoch": 0.6807131280388979,
"grad_norm": 0.5631510976247105,
"learning_rate": 3.87962962962963e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2960614562034607,
"step": 420,
"valid_targets_mean": 4590.2,
"valid_targets_min": 714
},
{
"epoch": 0.6888168557536467,
"grad_norm": 0.5090391200220923,
"learning_rate": 3.925925925925926e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2151426374912262,
"step": 425,
"valid_targets_mean": 4842.5,
"valid_targets_min": 1187
},
{
"epoch": 0.6969205834683955,
"grad_norm": 0.49546560892471103,
"learning_rate": 3.972222222222223e-05,
"loss": 0.2253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19332653284072876,
"step": 430,
"valid_targets_mean": 4583.8,
"valid_targets_min": 1348
},
{
"epoch": 0.7050243111831442,
"grad_norm": 0.426580811573209,
"learning_rate": 3.99999738705324e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22979189455509186,
"step": 435,
"valid_targets_mean": 6008.7,
"valid_targets_min": 2062
},
{
"epoch": 0.713128038897893,
"grad_norm": 0.5296107565627104,
"learning_rate": 3.999967991480598e-05,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2161000519990921,
"step": 440,
"valid_targets_mean": 4431.4,
"valid_targets_min": 1459
},
{
"epoch": 0.7212317666126418,
"grad_norm": 0.5911774054449865,
"learning_rate": 3.99990593463352e-05,
"loss": 0.2061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20900100469589233,
"step": 445,
"valid_targets_mean": 3832.8,
"valid_targets_min": 1421
},
{
"epoch": 0.7293354943273906,
"grad_norm": 0.50964362931027,
"learning_rate": 3.9998112175254504e-05,
"loss": 0.2348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19737258553504944,
"step": 450,
"valid_targets_mean": 4713.8,
"valid_targets_min": 1330
},
{
"epoch": 0.7374392220421394,
"grad_norm": 0.6532159249673581,
"learning_rate": 3.9996838417032044e-05,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1929355263710022,
"step": 455,
"valid_targets_mean": 3942.9,
"valid_targets_min": 845
},
{
"epoch": 0.7455429497568882,
"grad_norm": 0.4928978484161786,
"learning_rate": 3.999523809246943e-05,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20819595456123352,
"step": 460,
"valid_targets_mean": 5082.1,
"valid_targets_min": 1540
},
{
"epoch": 0.7536466774716369,
"grad_norm": 0.5236619156041604,
"learning_rate": 3.9993311227701415e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2349873036146164,
"step": 465,
"valid_targets_mean": 4213.9,
"valid_targets_min": 1406
},
{
"epoch": 0.7617504051863857,
"grad_norm": 0.603508775726922,
"learning_rate": 3.9991057854195424e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2348279356956482,
"step": 470,
"valid_targets_mean": 4291.8,
"valid_targets_min": 1307
},
{
"epoch": 0.7698541329011345,
"grad_norm": 0.5979704039956626,
"learning_rate": 3.998847800875107e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2371644824743271,
"step": 475,
"valid_targets_mean": 5716.9,
"valid_targets_min": 2081
},
{
"epoch": 0.7779578606158833,
"grad_norm": 0.5663750794625397,
"learning_rate": 3.9985571733499544e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16969016194343567,
"step": 480,
"valid_targets_mean": 3593.6,
"valid_targets_min": 1369
},
{
"epoch": 0.7860615883306321,
"grad_norm": 0.465204031907573,
"learning_rate": 3.998233907590294e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22521032392978668,
"step": 485,
"valid_targets_mean": 5773.2,
"valid_targets_min": 2696
},
{
"epoch": 0.7941653160453809,
"grad_norm": 0.5166936419430709,
"learning_rate": 3.9978780088753464e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1836811602115631,
"step": 490,
"valid_targets_mean": 4100.2,
"valid_targets_min": 1392
},
{
"epoch": 0.8022690437601296,
"grad_norm": 0.5850448684229496,
"learning_rate": 3.997489483017256e-05,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23051467537879944,
"step": 495,
"valid_targets_mean": 4196.2,
"valid_targets_min": 1467
},
{
"epoch": 0.8103727714748784,
"grad_norm": 0.5313568085982785,
"learning_rate": 3.997068336361e-05,
"loss": 0.2322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2501906752586365,
"step": 500,
"valid_targets_mean": 5268.7,
"valid_targets_min": 1424
},
{
"epoch": 0.8184764991896273,
"grad_norm": 0.45876391274602263,
"learning_rate": 3.996614575784282e-05,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22189603745937347,
"step": 505,
"valid_targets_mean": 5229.9,
"valid_targets_min": 1133
},
{
"epoch": 0.826580226904376,
"grad_norm": 0.5204098853244463,
"learning_rate": 3.99612820869742e-05,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2431417852640152,
"step": 510,
"valid_targets_mean": 5087.5,
"valid_targets_min": 773
},
{
"epoch": 0.8346839546191248,
"grad_norm": 0.5515103680701857,
"learning_rate": 3.9956092430432254e-05,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23825669288635254,
"step": 515,
"valid_targets_mean": 3682.3,
"valid_targets_min": 1074
},
{
"epoch": 0.8427876823338736,
"grad_norm": 0.49756644817448453,
"learning_rate": 3.9950576872968735e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24041366577148438,
"step": 520,
"valid_targets_mean": 4797.9,
"valid_targets_min": 1445
},
{
"epoch": 0.8508914100486223,
"grad_norm": 0.8994165287630641,
"learning_rate": 3.994473550465765e-05,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22890087962150574,
"step": 525,
"valid_targets_mean": 5103.2,
"valid_targets_min": 1313
},
{
"epoch": 0.8589951377633711,
"grad_norm": 0.5108141443277746,
"learning_rate": 3.993856842089379e-05,
"loss": 0.2422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22940672934055328,
"step": 530,
"valid_targets_mean": 5652.1,
"valid_targets_min": 2424
},
{
"epoch": 0.86709886547812,
"grad_norm": 0.5765103616276643,
"learning_rate": 3.99320757223912e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2153976708650589,
"step": 535,
"valid_targets_mean": 3130.8,
"valid_targets_min": 1286
},
{
"epoch": 0.8752025931928687,
"grad_norm": 0.5299043761506195,
"learning_rate": 3.992525751518144e-05,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21200573444366455,
"step": 540,
"valid_targets_mean": 4073.6,
"valid_targets_min": 1365
},
{
"epoch": 0.8833063209076175,
"grad_norm": 0.6103411854134536,
"learning_rate": 3.991811391061199e-05,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25960564613342285,
"step": 545,
"valid_targets_mean": 5217.1,
"valid_targets_min": 1356
},
{
"epoch": 0.8914100486223663,
"grad_norm": 0.5389982825030214,
"learning_rate": 3.9910645025344324e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22821247577667236,
"step": 550,
"valid_targets_mean": 5121.3,
"valid_targets_min": 1157
},
{
"epoch": 0.899513776337115,
"grad_norm": 0.5148328941205473,
"learning_rate": 3.990285098135204e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20730610191822052,
"step": 555,
"valid_targets_mean": 4166.3,
"valid_targets_min": 1343
},
{
"epoch": 0.9076175040518638,
"grad_norm": 0.4440249881059827,
"learning_rate": 3.98947319059189e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2121986448764801,
"step": 560,
"valid_targets_mean": 5257.2,
"valid_targets_min": 2014
},
{
"epoch": 0.9157212317666127,
"grad_norm": 0.5427347682275363,
"learning_rate": 3.988628793163669e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2212689220905304,
"step": 565,
"valid_targets_mean": 4286.0,
"valid_targets_min": 1240
},
{
"epoch": 0.9238249594813615,
"grad_norm": 0.4810450530247738,
"learning_rate": 3.987751919640309e-05,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2069002389907837,
"step": 570,
"valid_targets_mean": 4115.8,
"valid_targets_min": 2249
},
{
"epoch": 0.9319286871961102,
"grad_norm": 0.4785049236515675,
"learning_rate": 3.9868425843419445e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22010046243667603,
"step": 575,
"valid_targets_mean": 4391.6,
"valid_targets_min": 1467
},
{
"epoch": 0.940032414910859,
"grad_norm": 0.5830524896993419,
"learning_rate": 3.985900802118836e-05,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29115572571754456,
"step": 580,
"valid_targets_mean": 5825.9,
"valid_targets_min": 1375
},
{
"epoch": 0.9481361426256077,
"grad_norm": 0.5392327750650897,
"learning_rate": 3.984926588351135e-05,
"loss": 0.2435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22419336438179016,
"step": 585,
"valid_targets_mean": 4182.1,
"valid_targets_min": 1327
},
{
"epoch": 0.9562398703403565,
"grad_norm": 0.5044623427949209,
"learning_rate": 3.983919958948627e-05,
"loss": 0.2206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18491308391094208,
"step": 590,
"valid_targets_mean": 4006.9,
"valid_targets_min": 1321
},
{
"epoch": 0.9643435980551054,
"grad_norm": 0.4986732430556064,
"learning_rate": 3.982880930350474e-05,
"loss": 0.2245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21416428685188293,
"step": 595,
"valid_targets_mean": 4211.7,
"valid_targets_min": 1441
},
{
"epoch": 0.9724473257698542,
"grad_norm": 0.5124109728076002,
"learning_rate": 3.981809519524948e-05,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23443514108657837,
"step": 600,
"valid_targets_mean": 4845.2,
"valid_targets_min": 1626
},
{
"epoch": 0.9805510534846029,
"grad_norm": 0.47347249636382777,
"learning_rate": 3.98070574396915e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23536278307437897,
"step": 605,
"valid_targets_mean": 4644.9,
"valid_targets_min": 560
},
{
"epoch": 0.9886547811993517,
"grad_norm": 0.4741985537892797,
"learning_rate": 3.979569621708727e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21886685490608215,
"step": 610,
"valid_targets_mean": 4478.0,
"valid_targets_min": 1523
},
{
"epoch": 0.9967585089141004,
"grad_norm": 0.5974210354480042,
"learning_rate": 3.978401171297576e-05,
"loss": 0.2084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20954114198684692,
"step": 615,
"valid_targets_mean": 3642.8,
"valid_targets_min": 1394
},
{
"epoch": 1.0048622366288493,
"grad_norm": 0.5273995541794072,
"learning_rate": 3.9772004118175424e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2294274866580963,
"step": 620,
"valid_targets_mean": 4028.8,
"valid_targets_min": 1114
},
{
"epoch": 1.012965964343598,
"grad_norm": 0.5089306423895958,
"learning_rate": 3.975967362878106e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1963168829679489,
"step": 625,
"valid_targets_mean": 4406.2,
"valid_targets_min": 1467
},
{
"epoch": 1.0210696920583469,
"grad_norm": 0.6148003496273449,
"learning_rate": 3.9747020446160665e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2061430662870407,
"step": 630,
"valid_targets_mean": 4103.2,
"valid_targets_min": 2163
},
{
"epoch": 1.0291734197730957,
"grad_norm": 0.5805488016124426,
"learning_rate": 3.973404477695207e-05,
"loss": 0.206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21570029854774475,
"step": 635,
"valid_targets_mean": 4837.1,
"valid_targets_min": 1372
},
{
"epoch": 1.0372771474878444,
"grad_norm": 0.5200072266673288,
"learning_rate": 3.972074683305961e-05,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21892379224300385,
"step": 640,
"valid_targets_mean": 4104.2,
"valid_targets_min": 1333
},
{
"epoch": 1.0453808752025933,
"grad_norm": 0.5120591679389618,
"learning_rate": 3.970712683165066e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15413756668567657,
"step": 645,
"valid_targets_mean": 3574.6,
"valid_targets_min": 1450
},
{
"epoch": 1.053484602917342,
"grad_norm": 0.4986729646028235,
"learning_rate": 3.969318499515208e-05,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21150606870651245,
"step": 650,
"valid_targets_mean": 4572.9,
"valid_targets_min": 1004
},
{
"epoch": 1.0615883306320908,
"grad_norm": 0.4619514783129513,
"learning_rate": 3.967892155124659e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18860788643360138,
"step": 655,
"valid_targets_mean": 4465.8,
"valid_targets_min": 774
},
{
"epoch": 1.0696920583468394,
"grad_norm": 0.45418605837420345,
"learning_rate": 3.9664336732869044e-05,
"loss": 0.2191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19863459467887878,
"step": 660,
"valid_targets_mean": 4744.1,
"valid_targets_min": 1465
},
{
"epoch": 1.0777957860615883,
"grad_norm": 0.4863876337461995,
"learning_rate": 3.964943077820263e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24863094091415405,
"step": 665,
"valid_targets_mean": 5111.7,
"valid_targets_min": 1074
},
{
"epoch": 1.0858995137763372,
"grad_norm": 0.4769229701415419,
"learning_rate": 3.963420393067499e-05,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24888065457344055,
"step": 670,
"valid_targets_mean": 4371.7,
"valid_targets_min": 1409
},
{
"epoch": 1.0940032414910859,
"grad_norm": 0.5516196801331024,
"learning_rate": 3.961865643895422e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16257669031620026,
"step": 675,
"valid_targets_mean": 3767.6,
"valid_targets_min": 1354
},
{
"epoch": 1.1021069692058347,
"grad_norm": 0.6012761309137233,
"learning_rate": 3.960278855694484e-05,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20597979426383972,
"step": 680,
"valid_targets_mean": 3221.5,
"valid_targets_min": 459
},
{
"epoch": 1.1102106969205834,
"grad_norm": 0.5394070740857165,
"learning_rate": 3.958660054378361e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23972061276435852,
"step": 685,
"valid_targets_mean": 4129.9,
"valid_targets_min": 1312
},
{
"epoch": 1.1183144246353323,
"grad_norm": 0.6116321809309343,
"learning_rate": 3.9570092663835334e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1856822669506073,
"step": 690,
"valid_targets_mean": 4818.4,
"valid_targets_min": 1146
},
{
"epoch": 1.1264181523500811,
"grad_norm": 0.44563993029204846,
"learning_rate": 3.9553265186688525e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21733355522155762,
"step": 695,
"valid_targets_mean": 5456.4,
"valid_targets_min": 1418
},
{
"epoch": 1.1345218800648298,
"grad_norm": 0.5097046093454173,
"learning_rate": 3.953611838715101e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18223533034324646,
"step": 700,
"valid_targets_mean": 5043.8,
"valid_targets_min": 1353
},
{
"epoch": 1.1426256077795787,
"grad_norm": 0.4684279825286209,
"learning_rate": 3.951865254524542e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2561621069908142,
"step": 705,
"valid_targets_mean": 5526.7,
"valid_targets_min": 2616
},
{
"epoch": 1.1507293354943273,
"grad_norm": 0.4776014506859393,
"learning_rate": 3.950086794620467e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20872297883033752,
"step": 710,
"valid_targets_mean": 4848.7,
"valid_targets_min": 707
},
{
"epoch": 1.1588330632090762,
"grad_norm": 0.5021057874599553,
"learning_rate": 3.948276488046723e-05,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19527600705623627,
"step": 715,
"valid_targets_mean": 4283.8,
"valid_targets_min": 2009
},
{
"epoch": 1.1669367909238249,
"grad_norm": 0.516010687565433,
"learning_rate": 3.946434364367243e-05,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20048931241035461,
"step": 720,
"valid_targets_mean": 4517.3,
"valid_targets_min": 1286
},
{
"epoch": 1.1750405186385737,
"grad_norm": 0.4845283973803967,
"learning_rate": 3.9445604536655625e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18405257165431976,
"step": 725,
"valid_targets_mean": 3697.2,
"valid_targets_min": 1421
},
{
"epoch": 1.1831442463533226,
"grad_norm": 0.4974308404194371,
"learning_rate": 3.9426547865443264e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19134216010570526,
"step": 730,
"valid_targets_mean": 3739.6,
"valid_targets_min": 1313
},
{
"epoch": 1.1912479740680713,
"grad_norm": 0.4725179442958282,
"learning_rate": 3.940717394124792e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21701499819755554,
"step": 735,
"valid_targets_mean": 5500.9,
"valid_targets_min": 2302
},
{
"epoch": 1.1993517017828201,
"grad_norm": 0.4966790424314751,
"learning_rate": 3.938748308046318e-05,
"loss": 0.214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2208487093448639,
"step": 740,
"valid_targets_mean": 4056.9,
"valid_targets_min": 1194
},
{
"epoch": 1.2074554294975688,
"grad_norm": 0.44190871443509405,
"learning_rate": 3.9367475604658485e-05,
"loss": 0.2289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22573363780975342,
"step": 745,
"valid_targets_mean": 4984.1,
"valid_targets_min": 628
},
{
"epoch": 1.2155591572123177,
"grad_norm": 0.4969917236201204,
"learning_rate": 3.9347151840573915e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2162916660308838,
"step": 750,
"valid_targets_mean": 3742.9,
"valid_targets_min": 1585
},
{
"epoch": 1.2236628849270665,
"grad_norm": 0.49509015258174144,
"learning_rate": 3.932651212011479e-05,
"loss": 0.1949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18598730862140656,
"step": 755,
"valid_targets_mean": 4200.9,
"valid_targets_min": 1582
},
{
"epoch": 1.2317666126418152,
"grad_norm": 0.43884225031680624,
"learning_rate": 3.930555678034628e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21229609847068787,
"step": 760,
"valid_targets_mean": 4642.7,
"valid_targets_min": 1069
},
{
"epoch": 1.239870340356564,
"grad_norm": 0.5122574928153316,
"learning_rate": 3.9284286163487924e-05,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1989661157131195,
"step": 765,
"valid_targets_mean": 4026.2,
"valid_targets_min": 1399
},
{
"epoch": 1.2479740680713127,
"grad_norm": 0.5134191353676413,
"learning_rate": 3.9262700616908006e-05,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.239942729473114,
"step": 770,
"valid_targets_mean": 4500.2,
"valid_targets_min": 1423
},
{
"epoch": 1.2560777957860616,
"grad_norm": 0.458384033906824,
"learning_rate": 3.924080049311791e-05,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18945372104644775,
"step": 775,
"valid_targets_mean": 4252.0,
"valid_targets_min": 1361
},
{
"epoch": 1.2641815235008105,
"grad_norm": 0.42458575412199884,
"learning_rate": 3.921858614976632e-05,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20727957785129547,
"step": 780,
"valid_targets_mean": 5022.1,
"valid_targets_min": 2198
},
{
"epoch": 1.2722852512155591,
"grad_norm": 0.51192900661981,
"learning_rate": 3.919605794963343e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18662604689598083,
"step": 785,
"valid_targets_mean": 3851.8,
"valid_targets_min": 1488
},
{
"epoch": 1.280388978930308,
"grad_norm": 0.4668022934402429,
"learning_rate": 3.9173216260624994e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19831231236457825,
"step": 790,
"valid_targets_mean": 3995.3,
"valid_targets_min": 1467
},
{
"epoch": 1.2884927066450567,
"grad_norm": 0.4703228446731573,
"learning_rate": 3.915006145576632e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17850956320762634,
"step": 795,
"valid_targets_mean": 4885.1,
"valid_targets_min": 1423
},
{
"epoch": 1.2965964343598055,
"grad_norm": 0.5125676461591195,
"learning_rate": 3.912659391319617e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16043990850448608,
"step": 800,
"valid_targets_mean": 3561.5,
"valid_targets_min": 1361
},
{
"epoch": 1.3047001620745542,
"grad_norm": 0.43433575074873904,
"learning_rate": 3.910281401616061e-05,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17930254340171814,
"step": 805,
"valid_targets_mean": 4081.4,
"valid_targets_min": 1332
},
{
"epoch": 1.312803889789303,
"grad_norm": 0.42220097462239276,
"learning_rate": 3.907872215300672e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16810905933380127,
"step": 810,
"valid_targets_mean": 3859.5,
"valid_targets_min": 1351
},
{
"epoch": 1.320907617504052,
"grad_norm": 0.426999664447986,
"learning_rate": 3.905431871717628e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19243112206459045,
"step": 815,
"valid_targets_mean": 4594.4,
"valid_targets_min": 1473
},
{
"epoch": 1.3290113452188006,
"grad_norm": 0.5021614931496107,
"learning_rate": 3.902960410719931e-05,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.242889404296875,
"step": 820,
"valid_targets_mean": 3985.9,
"valid_targets_min": 1472
},
{
"epoch": 1.3371150729335495,
"grad_norm": 0.46392047570045136,
"learning_rate": 3.900457872668763e-05,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1502235233783722,
"step": 825,
"valid_targets_mean": 3738.2,
"valid_targets_min": 1018
},
{
"epoch": 1.3452188006482984,
"grad_norm": 0.4118848660851366,
"learning_rate": 3.897924298432816e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2182319462299347,
"step": 830,
"valid_targets_mean": 5490.6,
"valid_targets_min": 2289
},
{
"epoch": 1.353322528363047,
"grad_norm": 0.4280305041940191,
"learning_rate": 3.895359729387636e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21427130699157715,
"step": 835,
"valid_targets_mean": 4321.1,
"valid_targets_min": 1300
},
{
"epoch": 1.3614262560777957,
"grad_norm": 0.46406432789212704,
"learning_rate": 3.892764207414939e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19561821222305298,
"step": 840,
"valid_targets_mean": 4353.8,
"valid_targets_min": 1442
},
{
"epoch": 1.3695299837925445,
"grad_norm": 0.4179681529478451,
"learning_rate": 3.890137774901931e-05,
"loss": 0.2092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21955807507038116,
"step": 845,
"valid_targets_mean": 5324.8,
"valid_targets_min": 2282
},
{
"epoch": 1.3776337115072934,
"grad_norm": 0.48683442708968644,
"learning_rate": 3.887480474740616e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.204122394323349,
"step": 850,
"valid_targets_mean": 4110.2,
"valid_targets_min": 970
},
{
"epoch": 1.385737439222042,
"grad_norm": 0.42361528043877883,
"learning_rate": 3.8847923503270915e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18733659386634827,
"step": 855,
"valid_targets_mean": 4214.3,
"valid_targets_min": 1427
},
{
"epoch": 1.393841166936791,
"grad_norm": 0.4732297962200014,
"learning_rate": 3.8820734455608464e-05,
"loss": 0.1971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19635385274887085,
"step": 860,
"valid_targets_mean": 3787.2,
"valid_targets_min": 1393
},
{
"epoch": 1.4019448946515398,
"grad_norm": 0.4337879170512228,
"learning_rate": 3.879323804844038e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2074633687734604,
"step": 865,
"valid_targets_mean": 4273.1,
"valid_targets_min": 1281
},
{
"epoch": 1.4100486223662885,
"grad_norm": 0.4808999534174423,
"learning_rate": 3.876543473080771e-05,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.243323415517807,
"step": 870,
"valid_targets_mean": 4553.7,
"valid_targets_min": 1448
},
{
"epoch": 1.4181523500810373,
"grad_norm": 0.43158317153388576,
"learning_rate": 3.87373249567636e-05,
"loss": 0.1884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18346458673477173,
"step": 875,
"valid_targets_mean": 4949.8,
"valid_targets_min": 2071
},
{
"epoch": 1.426256077795786,
"grad_norm": 0.5068184567977475,
"learning_rate": 3.870890918536592e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1928868591785431,
"step": 880,
"valid_targets_mean": 4209.9,
"valid_targets_min": 1343
},
{
"epoch": 1.4343598055105349,
"grad_norm": 0.47287026057995374,
"learning_rate": 3.8680187880669765e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18420298397541046,
"step": 885,
"valid_targets_mean": 3873.4,
"valid_targets_min": 1356
},
{
"epoch": 1.4424635332252835,
"grad_norm": 0.43700819097301596,
"learning_rate": 3.865116151171983e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.164870485663414,
"step": 890,
"valid_targets_mean": 3684.1,
"valid_targets_min": 1318
},
{
"epoch": 1.4505672609400324,
"grad_norm": 0.47511708443362843,
"learning_rate": 3.8621830552542826e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17125675082206726,
"step": 895,
"valid_targets_mean": 3790.2,
"valid_targets_min": 1358
},
{
"epoch": 1.4586709886547813,
"grad_norm": 0.4709799341765991,
"learning_rate": 3.859219548213965e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19907286763191223,
"step": 900,
"valid_targets_mean": 3615.4,
"valid_targets_min": 1886
},
{
"epoch": 1.46677471636953,
"grad_norm": 0.45038440332952534,
"learning_rate": 3.856225678447764e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19604134559631348,
"step": 905,
"valid_targets_mean": 3964.0,
"valid_targets_min": 1365
},
{
"epoch": 1.4748784440842788,
"grad_norm": 0.4239032241495173,
"learning_rate": 3.853201494848263e-05,
"loss": 0.1836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17849305272102356,
"step": 910,
"valid_targets_mean": 4116.5,
"valid_targets_min": 736
},
{
"epoch": 1.4829821717990275,
"grad_norm": 0.44353633252428387,
"learning_rate": 3.8501470468030984e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1747392863035202,
"step": 915,
"valid_targets_mean": 4118.1,
"valid_targets_min": 1576
},
{
"epoch": 1.4910858995137763,
"grad_norm": 0.47312911378928535,
"learning_rate": 3.84706238419415e-05,
"loss": 0.206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21894387900829315,
"step": 920,
"valid_targets_mean": 4172.2,
"valid_targets_min": 1400
},
{
"epoch": 1.499189627228525,
"grad_norm": 0.4761430342519301,
"learning_rate": 3.8439475573967315e-05,
"loss": 0.1981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18914563953876495,
"step": 925,
"valid_targets_mean": 3912.1,
"valid_targets_min": 640
},
{
"epoch": 1.5072933549432739,
"grad_norm": 0.43698775643113397,
"learning_rate": 3.840802617278763e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2051890343427658,
"step": 930,
"valid_targets_mean": 4464.6,
"valid_targets_min": 1484
},
{
"epoch": 1.5153970826580228,
"grad_norm": 0.40937497215437296,
"learning_rate": 3.837627615199942e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21246007084846497,
"step": 935,
"valid_targets_mean": 5861.9,
"valid_targets_min": 1433
},
{
"epoch": 1.5235008103727714,
"grad_norm": 0.4612933987642411,
"learning_rate": 3.834422603010906e-05,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1685883104801178,
"step": 940,
"valid_targets_mean": 3331.0,
"valid_targets_min": 952
},
{
"epoch": 1.5316045380875203,
"grad_norm": 0.44748181235308926,
"learning_rate": 3.831187633052384e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18851560354232788,
"step": 945,
"valid_targets_mean": 4319.6,
"valid_targets_min": 1497
},
{
"epoch": 1.5397082658022692,
"grad_norm": 0.4645741670739686,
"learning_rate": 3.8279227581543424e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17598797380924225,
"step": 950,
"valid_targets_mean": 3860.6,
"valid_targets_min": 1325
},
{
"epoch": 1.5478119935170178,
"grad_norm": 0.4446178110855918,
"learning_rate": 3.824628031635122e-05,
"loss": 0.2109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20480293035507202,
"step": 955,
"valid_targets_mean": 5071.1,
"valid_targets_min": 1335
},
{
"epoch": 1.5559157212317665,
"grad_norm": 0.43176875691929406,
"learning_rate": 3.8213035073005665e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.195458322763443,
"step": 960,
"valid_targets_mean": 4873.1,
"valid_targets_min": 1731
},
{
"epoch": 1.5640194489465153,
"grad_norm": 0.4443525213532384,
"learning_rate": 3.817949239443147e-05,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20885604619979858,
"step": 965,
"valid_targets_mean": 4482.3,
"valid_targets_min": 2171
},
{
"epoch": 1.5721231766612642,
"grad_norm": 0.39045971509248545,
"learning_rate": 3.814565282841071e-05,
"loss": 0.1709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18435224890708923,
"step": 970,
"valid_targets_mean": 4966.6,
"valid_targets_min": 1448
},
{
"epoch": 1.5802269043760129,
"grad_norm": 0.42154294945737253,
"learning_rate": 3.81115169275739e-05,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14854902029037476,
"step": 975,
"valid_targets_mean": 3888.8,
"valid_targets_min": 1378
},
{
"epoch": 1.5883306320907618,
"grad_norm": 0.42988574528808304,
"learning_rate": 3.8077085249390997e-05,
"loss": 0.2002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2115168422460556,
"step": 980,
"valid_targets_mean": 4769.3,
"valid_targets_min": 1112
},
{
"epoch": 1.5964343598055106,
"grad_norm": 0.40490899317079226,
"learning_rate": 3.8042358356162215e-05,
"loss": 0.1967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20156720280647278,
"step": 985,
"valid_targets_mean": 4670.4,
"valid_targets_min": 1184
},
{
"epoch": 1.6045380875202593,
"grad_norm": 0.3933960356420022,
"learning_rate": 3.8007336815008945e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1848571002483368,
"step": 990,
"valid_targets_mean": 4553.4,
"valid_targets_min": 1393
},
{
"epoch": 1.6126418152350082,
"grad_norm": 0.425722007437382,
"learning_rate": 3.797202119786442e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1796191930770874,
"step": 995,
"valid_targets_mean": 4485.4,
"valid_targets_min": 1558
},
{
"epoch": 1.620745542949757,
"grad_norm": 0.38964048320391237,
"learning_rate": 3.79364120814644e-05,
"loss": 0.2208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22639715671539307,
"step": 1000,
"valid_targets_mean": 5330.9,
"valid_targets_min": 1302
},
{
"epoch": 1.6288492706645057,
"grad_norm": 0.41626273486480475,
"learning_rate": 3.790051004733775e-05,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2120615541934967,
"step": 1005,
"valid_targets_mean": 5283.8,
"valid_targets_min": 1492
},
{
"epoch": 1.6369529983792543,
"grad_norm": 0.5147342689508975,
"learning_rate": 3.786431568179697e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20870164036750793,
"step": 1010,
"valid_targets_mean": 4583.5,
"valid_targets_min": 1383
},
{
"epoch": 1.6450567260940032,
"grad_norm": 0.440817874619879,
"learning_rate": 3.7827829575928536e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18191151320934296,
"step": 1015,
"valid_targets_mean": 3649.4,
"valid_targets_min": 1358
},
{
"epoch": 1.653160453808752,
"grad_norm": 0.472655029247844,
"learning_rate": 3.779105232558337e-05,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25538885593414307,
"step": 1020,
"valid_targets_mean": 6181.6,
"valid_targets_min": 1234
},
{
"epoch": 1.6612641815235007,
"grad_norm": 0.4216306868266021,
"learning_rate": 3.775398453136701e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17359581589698792,
"step": 1025,
"valid_targets_mean": 3975.2,
"valid_targets_min": 736
},
{
"epoch": 1.6693679092382496,
"grad_norm": 0.39959055016658535,
"learning_rate": 3.771662679862984e-05,
"loss": 0.2012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18280324339866638,
"step": 1030,
"valid_targets_mean": 4821.5,
"valid_targets_min": 2264
},
{
"epoch": 1.6774716369529985,
"grad_norm": 0.4438321730012118,
"learning_rate": 3.767897973745721e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20099571347236633,
"step": 1035,
"valid_targets_mean": 4090.6,
"valid_targets_min": 1036
},
{
"epoch": 1.6855753646677472,
"grad_norm": 0.4291135125758818,
"learning_rate": 3.764104396265946e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2137276828289032,
"step": 1040,
"valid_targets_mean": 4530.7,
"valid_targets_min": 1375
},
{
"epoch": 1.6936790923824958,
"grad_norm": 0.4440714946429937,
"learning_rate": 3.760282009376187e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20279011130332947,
"step": 1045,
"valid_targets_mean": 4290.0,
"valid_targets_min": 1269
},
{
"epoch": 1.7017828200972447,
"grad_norm": 0.46369261424562613,
"learning_rate": 3.756430875499458e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18480262160301208,
"step": 1050,
"valid_targets_mean": 3838.8,
"valid_targets_min": 1402
},
{
"epoch": 1.7098865478119936,
"grad_norm": 0.4092457788481106,
"learning_rate": 3.7525510575282354e-05,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22688287496566772,
"step": 1055,
"valid_targets_mean": 5638.9,
"valid_targets_min": 1159
},
{
"epoch": 1.7179902755267422,
"grad_norm": 0.512732774310131,
"learning_rate": 3.748642618823432e-05,
"loss": 0.2242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1761859655380249,
"step": 1060,
"valid_targets_mean": 3192.5,
"valid_targets_min": 862
},
{
"epoch": 1.726094003241491,
"grad_norm": 0.44671104737829626,
"learning_rate": 3.744705623213365e-05,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18772464990615845,
"step": 1065,
"valid_targets_mean": 3969.5,
"valid_targets_min": 1310
},
{
"epoch": 1.73419773095624,
"grad_norm": 0.43601883404552333,
"learning_rate": 3.74074013499271e-05,
"loss": 0.1994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2021428793668747,
"step": 1070,
"valid_targets_mean": 5082.8,
"valid_targets_min": 1369
},
{
"epoch": 1.7423014586709886,
"grad_norm": 0.421028623668563,
"learning_rate": 3.736746218921453e-05,
"loss": 0.1875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16165471076965332,
"step": 1075,
"valid_targets_mean": 4049.3,
"valid_targets_min": 1509
},
{
"epoch": 1.7504051863857373,
"grad_norm": 0.4333329574828141,
"learning_rate": 3.732723940223832e-05,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2255226969718933,
"step": 1080,
"valid_targets_mean": 4857.2,
"valid_targets_min": 2369
},
{
"epoch": 1.7585089141004864,
"grad_norm": 0.8093577300516263,
"learning_rate": 3.7286733645872726e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16192904114723206,
"step": 1085,
"valid_targets_mean": 3395.7,
"valid_targets_min": 1402
},
{
"epoch": 1.766612641815235,
"grad_norm": 0.4303236270123881,
"learning_rate": 3.724594558161315e-05,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1886795163154602,
"step": 1090,
"valid_targets_mean": 4195.4,
"valid_targets_min": 1335
},
{
"epoch": 1.7747163695299837,
"grad_norm": 0.4271045023656605,
"learning_rate": 3.720487587556534e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22572541236877441,
"step": 1095,
"valid_targets_mean": 4628.6,
"valid_targets_min": 1527
},
{
"epoch": 1.7828200972447326,
"grad_norm": 0.4168865221240875,
"learning_rate": 3.716352519843448e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22260594367980957,
"step": 1100,
"valid_targets_mean": 5321.4,
"valid_targets_min": 1732
},
{
"epoch": 1.7909238249594814,
"grad_norm": 0.42384928589160936,
"learning_rate": 3.712189422551431e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18755793571472168,
"step": 1105,
"valid_targets_mean": 4328.8,
"valid_targets_min": 1434
},
{
"epoch": 1.79902755267423,
"grad_norm": 0.41646753010972154,
"learning_rate": 3.7079983636676005e-05,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20401719212532043,
"step": 1110,
"valid_targets_mean": 5051.8,
"valid_targets_min": 1410
},
{
"epoch": 1.807131280388979,
"grad_norm": 0.3813398032055785,
"learning_rate": 3.703779411635714e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1891724020242691,
"step": 1115,
"valid_targets_mean": 5103.3,
"valid_targets_min": 1392
},
{
"epoch": 1.8152350081037278,
"grad_norm": 0.46573526542742605,
"learning_rate": 3.6995326353550515e-05,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17837417125701904,
"step": 1120,
"valid_targets_mean": 3876.1,
"valid_targets_min": 1297
},
{
"epoch": 1.8233387358184765,
"grad_norm": 0.4534625642159336,
"learning_rate": 3.695258104179284e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1509757936000824,
"step": 1125,
"valid_targets_mean": 3438.0,
"valid_targets_min": 1239
},
{
"epoch": 1.8314424635332252,
"grad_norm": 0.4506591558299602,
"learning_rate": 3.690955887915347e-05,
"loss": 0.1873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1877855360507965,
"step": 1130,
"valid_targets_mean": 4014.6,
"valid_targets_min": 1346
},
{
"epoch": 1.839546191247974,
"grad_norm": 0.4008424296471736,
"learning_rate": 3.686626056822298e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1591203808784485,
"step": 1135,
"valid_targets_mean": 4374.0,
"valid_targets_min": 1357
},
{
"epoch": 1.847649918962723,
"grad_norm": 0.43014942361797626,
"learning_rate": 3.682268681610169e-05,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21824797987937927,
"step": 1140,
"valid_targets_mean": 4494.2,
"valid_targets_min": 1408
},
{
"epoch": 1.8557536466774716,
"grad_norm": 0.42136818327229264,
"learning_rate": 3.677883833438814e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1907494217157364,
"step": 1145,
"valid_targets_mean": 4776.2,
"valid_targets_min": 1475
},
{
"epoch": 1.8638573743922204,
"grad_norm": 0.4412420739828771,
"learning_rate": 3.6734715839167427e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16720981895923615,
"step": 1150,
"valid_targets_mean": 3630.3,
"valid_targets_min": 1298
},
{
"epoch": 1.8719611021069693,
"grad_norm": 0.4415751980816361,
"learning_rate": 3.669032005099954e-05,
"loss": 0.229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2498154640197754,
"step": 1155,
"valid_targets_mean": 5633.4,
"valid_targets_min": 1512
},
{
"epoch": 1.880064829821718,
"grad_norm": 0.40952145032072795,
"learning_rate": 3.664565169490761e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18677553534507751,
"step": 1160,
"valid_targets_mean": 4367.2,
"valid_targets_min": 1187
},
{
"epoch": 1.8881685575364666,
"grad_norm": 0.489258878774405,
"learning_rate": 3.660071150036602e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20160531997680664,
"step": 1165,
"valid_targets_mean": 4219.1,
"valid_targets_min": 1345
},
{
"epoch": 1.8962722852512157,
"grad_norm": 0.4525265915982652,
"learning_rate": 3.655550020128852e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2606647312641144,
"step": 1170,
"valid_targets_mean": 4542.6,
"valid_targets_min": 1351
},
{
"epoch": 1.9043760129659644,
"grad_norm": 0.39049624581473075,
"learning_rate": 3.651001853601627e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17106109857559204,
"step": 1175,
"valid_targets_mean": 4377.2,
"valid_targets_min": 808
},
{
"epoch": 1.912479740680713,
"grad_norm": 0.39226733614625686,
"learning_rate": 3.646426724730572e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21923178434371948,
"step": 1180,
"valid_targets_mean": 4946.4,
"valid_targets_min": 1406
},
{
"epoch": 1.920583468395462,
"grad_norm": 0.3831318298196707,
"learning_rate": 3.641824708231653e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23360614478588104,
"step": 1185,
"valid_targets_mean": 6560.4,
"valid_targets_min": 2831
},
{
"epoch": 1.9286871961102108,
"grad_norm": 0.39667541079665347,
"learning_rate": 3.6371958792599346e-05,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15785202383995056,
"step": 1190,
"valid_targets_mean": 4117.3,
"valid_targets_min": 1326
},
{
"epoch": 1.9367909238249594,
"grad_norm": 0.44441348853109325,
"learning_rate": 3.632540313408353e-05,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15401755273342133,
"step": 1195,
"valid_targets_mean": 3274.1,
"valid_targets_min": 1398
},
{
"epoch": 1.9448946515397083,
"grad_norm": 0.4016343317461078,
"learning_rate": 3.627858086706483e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17341655492782593,
"step": 1200,
"valid_targets_mean": 4483.2,
"valid_targets_min": 1306
},
{
"epoch": 1.9529983792544572,
"grad_norm": 0.39527315259402573,
"learning_rate": 3.6231492756192924e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22069337964057922,
"step": 1205,
"valid_targets_mean": 5291.3,
"valid_targets_min": 827
},
{
"epoch": 1.9611021069692058,
"grad_norm": 0.47431992205560747,
"learning_rate": 3.618413957045899e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19169411063194275,
"step": 1210,
"valid_targets_mean": 3384.5,
"valid_targets_min": 1366
},
{
"epoch": 1.9692058346839545,
"grad_norm": 0.42588976710081894,
"learning_rate": 3.6136522083183096e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1703414022922516,
"step": 1215,
"valid_targets_mean": 4210.9,
"valid_targets_min": 1380
},
{
"epoch": 1.9773095623987034,
"grad_norm": 0.3993131140715784,
"learning_rate": 3.608864107200159e-05,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21244439482688904,
"step": 1220,
"valid_targets_mean": 4543.6,
"valid_targets_min": 2047
},
{
"epoch": 1.9854132901134522,
"grad_norm": 0.4344328322329922,
"learning_rate": 3.604049731885442e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18995779752731323,
"step": 1225,
"valid_targets_mean": 4069.1,
"valid_targets_min": 1394
},
{
"epoch": 1.993517017828201,
"grad_norm": 0.4400446086567771,
"learning_rate": 3.599209160997234e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21253399550914764,
"step": 1230,
"valid_targets_mean": 4556.4,
"valid_targets_min": 1281
},
{
"epoch": 2.0016207455429496,
"grad_norm": 0.376589399977183,
"learning_rate": 3.594342473586406e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1640516221523285,
"step": 1235,
"valid_targets_mean": 5084.4,
"valid_targets_min": 1255
},
{
"epoch": 2.0097244732576987,
"grad_norm": 0.48073326523872145,
"learning_rate": 3.589449749130337e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18342489004135132,
"step": 1240,
"valid_targets_mean": 3867.4,
"valid_targets_min": 1240
},
{
"epoch": 2.0178282009724473,
"grad_norm": 0.3727414184617058,
"learning_rate": 3.5845310675316134e-05,
"loss": 0.1988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20190215110778809,
"step": 1245,
"valid_targets_mean": 5865.1,
"valid_targets_min": 1351
},
{
"epoch": 2.025931928687196,
"grad_norm": 0.4395786818226242,
"learning_rate": 3.5795865091167266e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18115079402923584,
"step": 1250,
"valid_targets_mean": 3741.1,
"valid_targets_min": 1344
},
{
"epoch": 2.034035656401945,
"grad_norm": 0.3870970421019821,
"learning_rate": 3.574616154634758e-05,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15488159656524658,
"step": 1255,
"valid_targets_mean": 4509.9,
"valid_targets_min": 1438
},
{
"epoch": 2.0421393841166937,
"grad_norm": 0.3885177527861475,
"learning_rate": 3.569620085256062e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14700886607170105,
"step": 1260,
"valid_targets_mean": 4300.9,
"valid_targets_min": 1420
},
{
"epoch": 2.0502431118314424,
"grad_norm": 0.44324292584585834,
"learning_rate": 3.564598382570943e-05,
"loss": 0.185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14767037332057953,
"step": 1265,
"valid_targets_mean": 3636.4,
"valid_targets_min": 1430
},
{
"epoch": 2.0583468395461915,
"grad_norm": 0.397763872763852,
"learning_rate": 3.559551128588316e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16453808546066284,
"step": 1270,
"valid_targets_mean": 4420.4,
"valid_targets_min": 1350
},
{
"epoch": 2.06645056726094,
"grad_norm": 0.4902672391158386,
"learning_rate": 3.5544784057343746e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16574980318546295,
"step": 1275,
"valid_targets_mean": 4362.5,
"valid_targets_min": 1247
},
{
"epoch": 2.0745542949756888,
"grad_norm": 0.4352472097503133,
"learning_rate": 3.549380296851242e-05,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19808019697666168,
"step": 1280,
"valid_targets_mean": 4214.6,
"valid_targets_min": 1297
},
{
"epoch": 2.0826580226904374,
"grad_norm": 0.4536384304875176,
"learning_rate": 3.544256885195616e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2267465442419052,
"step": 1285,
"valid_targets_mean": 4676.0,
"valid_targets_min": 1323
},
{
"epoch": 2.0907617504051865,
"grad_norm": 0.4698011780277878,
"learning_rate": 3.539108254437414e-05,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25781187415122986,
"step": 1290,
"valid_targets_mean": 4513.7,
"valid_targets_min": 1157
},
{
"epoch": 2.098865478119935,
"grad_norm": 0.4401070741229321,
"learning_rate": 3.5339344886584015e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21556992828845978,
"step": 1295,
"valid_targets_mean": 4360.9,
"valid_targets_min": 1437
},
{
"epoch": 2.106969205834684,
"grad_norm": 0.3792798518134474,
"learning_rate": 3.5287356723508245e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13958227634429932,
"step": 1300,
"valid_targets_mean": 4286.2,
"valid_targets_min": 1449
},
{
"epoch": 2.115072933549433,
"grad_norm": 0.45008204561893017,
"learning_rate": 3.523511890416023e-05,
"loss": 0.1716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16553236544132233,
"step": 1305,
"valid_targets_mean": 3613.5,
"valid_targets_min": 1289
},
{
"epoch": 2.1231766612641816,
"grad_norm": 0.45695133866981186,
"learning_rate": 3.518263228163051e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20444339513778687,
"step": 1310,
"valid_targets_mean": 4116.8,
"valid_targets_min": 1346
},
{
"epoch": 2.1312803889789302,
"grad_norm": 0.39290783269742174,
"learning_rate": 3.51298977130728e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1730700433254242,
"step": 1315,
"valid_targets_mean": 4396.1,
"valid_targets_min": 1342
},
{
"epoch": 2.139384116693679,
"grad_norm": 0.40014498463542075,
"learning_rate": 3.507691605968997e-05,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16938640177249908,
"step": 1320,
"valid_targets_mean": 4114.8,
"valid_targets_min": 1405
},
{
"epoch": 2.147487844408428,
"grad_norm": 0.4604317863246907,
"learning_rate": 3.5023688186720047e-05,
"loss": 0.1722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17205074429512024,
"step": 1325,
"valid_targets_mean": 4108.2,
"valid_targets_min": 1265
},
{
"epoch": 2.1555915721231766,
"grad_norm": 0.4533604714522615,
"learning_rate": 3.497021496342203e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2422681301832199,
"step": 1330,
"valid_targets_mean": 4779.9,
"valid_targets_min": 1374
},
{
"epoch": 2.1636952998379253,
"grad_norm": 0.4245083665207859,
"learning_rate": 3.491649726306168e-05,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18867146968841553,
"step": 1335,
"valid_targets_mean": 4150.7,
"valid_targets_min": 800
},
{
"epoch": 2.1717990275526744,
"grad_norm": 0.395493334600026,
"learning_rate": 3.486253596289734e-05,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16125865280628204,
"step": 1340,
"valid_targets_mean": 4261.9,
"valid_targets_min": 931
},
{
"epoch": 2.179902755267423,
"grad_norm": 0.386658367081084,
"learning_rate": 3.4808331944165524e-05,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16777998208999634,
"step": 1345,
"valid_targets_mean": 4928.1,
"valid_targets_min": 2040
},
{
"epoch": 2.1880064829821717,
"grad_norm": 0.43589523641868716,
"learning_rate": 3.4753886092066546e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1735723465681076,
"step": 1350,
"valid_targets_mean": 4623.9,
"valid_targets_min": 1491
},
{
"epoch": 2.1961102106969204,
"grad_norm": 0.4408530475086916,
"learning_rate": 3.469919929575012e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18745142221450806,
"step": 1355,
"valid_targets_mean": 4525.6,
"valid_targets_min": 1432
},
{
"epoch": 2.2042139384116695,
"grad_norm": 0.4038864126061987,
"learning_rate": 3.464427244830076e-05,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20079880952835083,
"step": 1360,
"valid_targets_mean": 5277.9,
"valid_targets_min": 2301
},
{
"epoch": 2.212317666126418,
"grad_norm": 0.4076427396108117,
"learning_rate": 3.458910644672324e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.216787189245224,
"step": 1365,
"valid_targets_mean": 4685.8,
"valid_targets_min": 1483
},
{
"epoch": 2.2204213938411668,
"grad_norm": 0.4855663407841619,
"learning_rate": 3.453370219192794e-05,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19118541479110718,
"step": 1370,
"valid_targets_mean": 4399.9,
"valid_targets_min": 2187
},
{
"epoch": 2.228525121555916,
"grad_norm": 0.3994628496568297,
"learning_rate": 3.4478060588716116e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14572611451148987,
"step": 1375,
"valid_targets_mean": 4617.7,
"valid_targets_min": 861
},
{
"epoch": 2.2366288492706645,
"grad_norm": 0.3932883085770016,
"learning_rate": 3.442218254576516e-05,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1831832379102707,
"step": 1380,
"valid_targets_mean": 4674.9,
"valid_targets_min": 1402
},
{
"epoch": 2.244732576985413,
"grad_norm": 0.41916131913527677,
"learning_rate": 3.436606897561372e-05,
"loss": 0.1894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16581913828849792,
"step": 1385,
"valid_targets_mean": 3935.7,
"valid_targets_min": 715
},
{
"epoch": 2.2528363047001623,
"grad_norm": 0.39450553784213077,
"learning_rate": 3.430972079464682e-05,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16457019746303558,
"step": 1390,
"valid_targets_mean": 4476.0,
"valid_targets_min": 2399
},
{
"epoch": 2.260940032414911,
"grad_norm": 0.3982500467520962,
"learning_rate": 3.425313892308089e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18190191686153412,
"step": 1395,
"valid_targets_mean": 4379.4,
"valid_targets_min": 1290
},
{
"epoch": 2.2690437601296596,
"grad_norm": 0.41772831520986997,
"learning_rate": 3.419632428494873e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19021040201187134,
"step": 1400,
"valid_targets_mean": 4824.2,
"valid_targets_min": 1316
},
{
"epoch": 2.2771474878444082,
"grad_norm": 0.41971007165893703,
"learning_rate": 3.413927780808443e-05,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17558398842811584,
"step": 1405,
"valid_targets_mean": 4265.2,
"valid_targets_min": 1603
},
{
"epoch": 2.2852512155591573,
"grad_norm": 0.43515280086555264,
"learning_rate": 3.4082000424108235e-05,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17722058296203613,
"step": 1410,
"valid_targets_mean": 3829.9,
"valid_targets_min": 1239
},
{
"epoch": 2.293354943273906,
"grad_norm": 0.43561699538725956,
"learning_rate": 3.402449306841128e-05,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14969691634178162,
"step": 1415,
"valid_targets_mean": 3743.6,
"valid_targets_min": 720
},
{
"epoch": 2.3014586709886546,
"grad_norm": 0.39844393207435513,
"learning_rate": 3.396675668014035e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1564260721206665,
"step": 1420,
"valid_targets_mean": 4526.0,
"valid_targets_min": 1366
},
{
"epoch": 2.3095623987034037,
"grad_norm": 0.38012444527299505,
"learning_rate": 3.390879220218258e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1637035608291626,
"step": 1425,
"valid_targets_mean": 4802.2,
"valid_targets_min": 2401
},
{
"epoch": 2.3176661264181524,
"grad_norm": 0.4454911522622101,
"learning_rate": 3.385060058114995e-05,
"loss": 0.1836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19235506653785706,
"step": 1430,
"valid_targets_mean": 3851.9,
"valid_targets_min": 1369
},
{
"epoch": 2.325769854132901,
"grad_norm": 0.43173142182525054,
"learning_rate": 3.379218276736393e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16525980830192566,
"step": 1435,
"valid_targets_mean": 4005.5,
"valid_targets_min": 1307
},
{
"epoch": 2.3338735818476497,
"grad_norm": 0.4623667736311442,
"learning_rate": 3.373353971483992e-05,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18194140493869781,
"step": 1440,
"valid_targets_mean": 4458.6,
"valid_targets_min": 1463
},
{
"epoch": 2.341977309562399,
"grad_norm": 0.43331675656237917,
"learning_rate": 3.367467238127165e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2014952003955841,
"step": 1445,
"valid_targets_mean": 4562.3,
"valid_targets_min": 1395
},
{
"epoch": 2.3500810372771475,
"grad_norm": 0.4436223038884395,
"learning_rate": 3.361558172801558e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19612324237823486,
"step": 1450,
"valid_targets_mean": 3939.1,
"valid_targets_min": 1480
},
{
"epoch": 2.358184764991896,
"grad_norm": 0.4077226858119085,
"learning_rate": 3.355626872007518e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17097198963165283,
"step": 1455,
"valid_targets_mean": 4233.2,
"valid_targets_min": 1463
},
{
"epoch": 2.366288492706645,
"grad_norm": 0.3959886507466225,
"learning_rate": 3.3496734326085154e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17004629969596863,
"step": 1460,
"valid_targets_mean": 4284.9,
"valid_targets_min": 1358
},
{
"epoch": 2.374392220421394,
"grad_norm": 0.3684059118907128,
"learning_rate": 3.3436979518295674e-05,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20196950435638428,
"step": 1465,
"valid_targets_mean": 6075.1,
"valid_targets_min": 1361
},
{
"epoch": 2.3824959481361425,
"grad_norm": 0.3545113971679958,
"learning_rate": 3.337700527255643e-05,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15890374779701233,
"step": 1470,
"valid_targets_mean": 5087.4,
"valid_targets_min": 1455
},
{
"epoch": 2.3905996758508916,
"grad_norm": 0.3840316800210763,
"learning_rate": 3.331681256830074e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1505197286605835,
"step": 1475,
"valid_targets_mean": 4215.2,
"valid_targets_min": 1356
},
{
"epoch": 2.3987034035656403,
"grad_norm": 0.37876560844311763,
"learning_rate": 3.325640238852958e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1649443656206131,
"step": 1480,
"valid_targets_mean": 4721.5,
"valid_targets_min": 1414
},
{
"epoch": 2.406807131280389,
"grad_norm": 0.36497991834361543,
"learning_rate": 3.319577571979544e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1684037744998932,
"step": 1485,
"valid_targets_mean": 5173.7,
"valid_targets_min": 1511
},
{
"epoch": 2.4149108589951376,
"grad_norm": 0.418707067779524,
"learning_rate": 3.313493355218632e-05,
"loss": 0.1833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20251314342021942,
"step": 1490,
"valid_targets_mean": 5805.2,
"valid_targets_min": 3142
},
{
"epoch": 2.4230145867098867,
"grad_norm": 0.3779593561527125,
"learning_rate": 3.307387687930947e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20684057474136353,
"step": 1495,
"valid_targets_mean": 5985.4,
"valid_targets_min": 1380
},
{
"epoch": 2.4311183144246353,
"grad_norm": 0.42380788528949165,
"learning_rate": 3.301260669827524e-05,
"loss": 0.1748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20908914506435394,
"step": 1500,
"valid_targets_mean": 5506.3,
"valid_targets_min": 1379
},
{
"epoch": 2.439222042139384,
"grad_norm": 0.43809464646488216,
"learning_rate": 3.295112400968073e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1538805365562439,
"step": 1505,
"valid_targets_mean": 3471.2,
"valid_targets_min": 1307
},
{
"epoch": 2.447325769854133,
"grad_norm": 0.45057766440485186,
"learning_rate": 3.2889429817593494e-05,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14621488749980927,
"step": 1510,
"valid_targets_mean": 5778.6,
"valid_targets_min": 1370
},
{
"epoch": 2.4554294975688817,
"grad_norm": 0.46698315776014765,
"learning_rate": 3.2827525129535135e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16353151202201843,
"step": 1515,
"valid_targets_mean": 3501.4,
"valid_targets_min": 1103
},
{
"epoch": 2.4635332252836304,
"grad_norm": 0.3562496067632637,
"learning_rate": 3.276541095646482e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15975715219974518,
"step": 1520,
"valid_targets_mean": 5539.9,
"valid_targets_min": 1481
},
{
"epoch": 2.471636952998379,
"grad_norm": 0.36221972351349063,
"learning_rate": 3.2703088312762825e-05,
"loss": 0.1879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14780882000923157,
"step": 1525,
"valid_targets_mean": 4646.3,
"valid_targets_min": 1338
},
{
"epoch": 2.479740680713128,
"grad_norm": 0.4051828309440133,
"learning_rate": 3.2640558216213914e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16273058950901031,
"step": 1530,
"valid_targets_mean": 4293.0,
"valid_targets_min": 1364
},
{
"epoch": 2.487844408427877,
"grad_norm": 0.42177182526238644,
"learning_rate": 3.2577821687990764e-05,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16551074385643005,
"step": 1535,
"valid_targets_mean": 3971.9,
"valid_targets_min": 1276
},
{
"epoch": 2.4959481361426255,
"grad_norm": 0.42852114939450653,
"learning_rate": 3.2514879752637236e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19772499799728394,
"step": 1540,
"valid_targets_mean": 4545.6,
"valid_targets_min": 1195
},
{
"epoch": 2.5040518638573745,
"grad_norm": 0.3858613190702104,
"learning_rate": 3.2451733438051705e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14023137092590332,
"step": 1545,
"valid_targets_mean": 4263.2,
"valid_targets_min": 1366
},
{
"epoch": 2.512155591572123,
"grad_norm": 0.45356793401017254,
"learning_rate": 3.238838377547023e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16204509139060974,
"step": 1550,
"valid_targets_mean": 3907.6,
"valid_targets_min": 844
},
{
"epoch": 2.520259319286872,
"grad_norm": 0.40037894398264473,
"learning_rate": 3.2324831799449724e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17270907759666443,
"step": 1555,
"valid_targets_mean": 4516.8,
"valid_targets_min": 2478
},
{
"epoch": 2.528363047001621,
"grad_norm": 0.40844298271631924,
"learning_rate": 3.226107854785106e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1686622053384781,
"step": 1560,
"valid_targets_mean": 4280.8,
"valid_targets_min": 1433
},
{
"epoch": 2.5364667747163696,
"grad_norm": 0.3902243378177505,
"learning_rate": 3.2197125061822135e-05,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18913598358631134,
"step": 1565,
"valid_targets_mean": 5352.0,
"valid_targets_min": 1356
},
{
"epoch": 2.5445705024311183,
"grad_norm": 0.44643382348376237,
"learning_rate": 3.213297238578082e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1804146021604538,
"step": 1570,
"valid_targets_mean": 3832.6,
"valid_targets_min": 1416
},
{
"epoch": 2.5526742301458674,
"grad_norm": 0.3677125080484775,
"learning_rate": 3.206862156739799e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17965905368328094,
"step": 1575,
"valid_targets_mean": 5295.1,
"valid_targets_min": 1944
},
{
"epoch": 2.560777957860616,
"grad_norm": 0.424694281418007,
"learning_rate": 3.2004073657580314e-05,
"loss": 0.1701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16907522082328796,
"step": 1580,
"valid_targets_mean": 4285.1,
"valid_targets_min": 1325
},
{
"epoch": 2.5688816855753647,
"grad_norm": 0.3836005236671189,
"learning_rate": 3.193932971045316e-05,
"loss": 0.1671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1842470020055771,
"step": 1585,
"valid_targets_mean": 5091.1,
"valid_targets_min": 2127
},
{
"epoch": 2.5769854132901133,
"grad_norm": 0.42016506443574564,
"learning_rate": 3.187439078334338e-05,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18808531761169434,
"step": 1590,
"valid_targets_mean": 4131.1,
"valid_targets_min": 1279
},
{
"epoch": 2.585089141004862,
"grad_norm": 0.39085605322357647,
"learning_rate": 3.180925793676199e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17691290378570557,
"step": 1595,
"valid_targets_mean": 4609.9,
"valid_targets_min": 1309
},
{
"epoch": 2.593192868719611,
"grad_norm": 0.3909121224465065,
"learning_rate": 3.1743932234386905e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15855155885219574,
"step": 1600,
"valid_targets_mean": 4398.2,
"valid_targets_min": 2216
},
{
"epoch": 2.6012965964343597,
"grad_norm": 0.36211045372400313,
"learning_rate": 3.167841474304555e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17921733856201172,
"step": 1605,
"valid_targets_mean": 5015.9,
"valid_targets_min": 1357
},
{
"epoch": 2.6094003241491084,
"grad_norm": 0.37957996352532186,
"learning_rate": 3.161270653269743e-05,
"loss": 0.1843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18475927412509918,
"step": 1610,
"valid_targets_mean": 5157.6,
"valid_targets_min": 2993
},
{
"epoch": 2.6175040518638575,
"grad_norm": 0.36705428465477125,
"learning_rate": 3.154680867641666e-05,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19124308228492737,
"step": 1615,
"valid_targets_mean": 5468.5,
"valid_targets_min": 1530
},
{
"epoch": 2.625607779578606,
"grad_norm": 0.424405031181383,
"learning_rate": 3.1480722250374454e-05,
"loss": 0.1866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20675238966941833,
"step": 1620,
"valid_targets_mean": 5237.4,
"valid_targets_min": 1502
},
{
"epoch": 2.633711507293355,
"grad_norm": 0.3963476176633248,
"learning_rate": 3.1414448333821526e-05,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1941150426864624,
"step": 1625,
"valid_targets_mean": 4785.1,
"valid_targets_min": 2163
},
{
"epoch": 2.641815235008104,
"grad_norm": 0.41204588126736313,
"learning_rate": 3.1347988009070496e-05,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21974653005599976,
"step": 1630,
"valid_targets_mean": 4643.4,
"valid_targets_min": 2384
},
{
"epoch": 2.6499189627228525,
"grad_norm": 0.348197515719351,
"learning_rate": 3.1281342361478184e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14443612098693848,
"step": 1635,
"valid_targets_mean": 4822.6,
"valid_targets_min": 2198
},
{
"epoch": 2.658022690437601,
"grad_norm": 0.43986322837355346,
"learning_rate": 3.121451247942789e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20639345049858093,
"step": 1640,
"valid_targets_mean": 4152.5,
"valid_targets_min": 1306
},
{
"epoch": 2.6661264181523503,
"grad_norm": 0.38870221906381547,
"learning_rate": 3.1147499454311654e-05,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18374845385551453,
"step": 1645,
"valid_targets_mean": 4483.2,
"valid_targets_min": 848
},
{
"epoch": 2.674230145867099,
"grad_norm": 0.36761988123246936,
"learning_rate": 3.1080304380512386e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14270418882369995,
"step": 1650,
"valid_targets_mean": 4992.8,
"valid_targets_min": 2372
},
{
"epoch": 2.6823338735818476,
"grad_norm": 0.39358600764755813,
"learning_rate": 3.101292835538602e-05,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18195050954818726,
"step": 1655,
"valid_targets_mean": 5848.4,
"valid_targets_min": 2184
},
{
"epoch": 2.6904376012965967,
"grad_norm": 0.38005284644189086,
"learning_rate": 3.0945372479243605e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.175418421626091,
"step": 1660,
"valid_targets_mean": 4281.4,
"valid_targets_min": 1260
},
{
"epoch": 2.6985413290113454,
"grad_norm": 0.4499877538649714,
"learning_rate": 3.087763785533328e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2106286883354187,
"step": 1665,
"valid_targets_mean": 3791.6,
"valid_targets_min": 1351
},
{
"epoch": 2.706645056726094,
"grad_norm": 0.4022005851852449,
"learning_rate": 3.0809725589822325e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18053220212459564,
"step": 1670,
"valid_targets_mean": 4554.2,
"valid_targets_min": 2254
},
{
"epoch": 2.7147487844408427,
"grad_norm": 0.38257462905088174,
"learning_rate": 3.074163679177907e-05,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21444633603096008,
"step": 1675,
"valid_targets_mean": 5958.8,
"valid_targets_min": 2338
},
{
"epoch": 2.7228525121555913,
"grad_norm": 0.4439641195628155,
"learning_rate": 3.067337257315477e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23471331596374512,
"step": 1680,
"valid_targets_mean": 4376.6,
"valid_targets_min": 2428
},
{
"epoch": 2.7309562398703404,
"grad_norm": 0.49885017003598664,
"learning_rate": 3.0604934048765444e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17425662279129028,
"step": 1685,
"valid_targets_mean": 3140.1,
"valid_targets_min": 1142
},
{
"epoch": 2.739059967585089,
"grad_norm": 0.39244438059170533,
"learning_rate": 3.05363223362737e-05,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.177323579788208,
"step": 1690,
"valid_targets_mean": 4580.3,
"valid_targets_min": 1184
},
{
"epoch": 2.7471636952998377,
"grad_norm": 0.43590713281508214,
"learning_rate": 3.0467538556170463e-05,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19646786153316498,
"step": 1695,
"valid_targets_mean": 3882.8,
"valid_targets_min": 1316
},
{
"epoch": 2.755267423014587,
"grad_norm": 0.4140052856791728,
"learning_rate": 3.0398583831756655e-05,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17302680015563965,
"step": 1700,
"valid_targets_mean": 4188.7,
"valid_targets_min": 1384
},
{
"epoch": 2.7633711507293355,
"grad_norm": 0.42351239820043063,
"learning_rate": 3.03294592891249e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16667763888835907,
"step": 1705,
"valid_targets_mean": 4216.1,
"valid_targets_min": 1394
},
{
"epoch": 2.771474878444084,
"grad_norm": 0.4690366006019746,
"learning_rate": 3.0260166057141086e-05,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17848166823387146,
"step": 1710,
"valid_targets_mean": 3578.8,
"valid_targets_min": 1101
},
{
"epoch": 2.7795786061588332,
"grad_norm": 0.5127351606909685,
"learning_rate": 3.0190705267425956e-05,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2254772037267685,
"step": 1715,
"valid_targets_mean": 3151.7,
"valid_targets_min": 1365
},
{
"epoch": 2.787682333873582,
"grad_norm": 0.47576208857320945,
"learning_rate": 3.0121078054336633e-05,
"loss": 0.1912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18778353929519653,
"step": 1720,
"valid_targets_mean": 3748.5,
"valid_targets_min": 714
},
{
"epoch": 2.7957860615883305,
"grad_norm": 0.4531881309902607,
"learning_rate": 3.005128555494806e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19288434088230133,
"step": 1725,
"valid_targets_mean": 5238.9,
"valid_targets_min": 1646
},
{
"epoch": 2.8038897893030796,
"grad_norm": 0.37505653972841513,
"learning_rate": 2.998132890903448e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1486460566520691,
"step": 1730,
"valid_targets_mean": 4244.6,
"valid_targets_min": 1485
},
{
"epoch": 2.8119935170178283,
"grad_norm": 0.3972142880917285,
"learning_rate": 2.9911209259050763e-05,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21991488337516785,
"step": 1735,
"valid_targets_mean": 5093.3,
"valid_targets_min": 707
},
{
"epoch": 2.820097244732577,
"grad_norm": 0.4265599882568908,
"learning_rate": 2.984092775011382e-05,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17646397650241852,
"step": 1740,
"valid_targets_mean": 3938.9,
"valid_targets_min": 1270
},
{
"epoch": 2.828200972447326,
"grad_norm": 0.4228912084128686,
"learning_rate": 2.9770485529983834e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18994967639446259,
"step": 1745,
"valid_targets_mean": 4213.4,
"valid_targets_min": 300
},
{
"epoch": 2.8363047001620747,
"grad_norm": 0.373449509905702,
"learning_rate": 2.9699883749045564e-05,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1784120500087738,
"step": 1750,
"valid_targets_mean": 4853.6,
"valid_targets_min": 987
},
{
"epoch": 2.8444084278768234,
"grad_norm": 0.393297545157333,
"learning_rate": 2.962912356028953e-05,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1601720005273819,
"step": 1755,
"valid_targets_mean": 4341.7,
"valid_targets_min": 1457
},
{
"epoch": 2.852512155591572,
"grad_norm": 0.39420593273198135,
"learning_rate": 2.95582061192932e-05,
"loss": 0.1766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16387531161308289,
"step": 1760,
"valid_targets_mean": 4608.4,
"valid_targets_min": 1457
},
{
"epoch": 2.8606158833063207,
"grad_norm": 0.45248636903908407,
"learning_rate": 2.9487132584202115e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17816318571567535,
"step": 1765,
"valid_targets_mean": 4026.9,
"valid_targets_min": 736
},
{
"epoch": 2.8687196110210698,
"grad_norm": 0.4420996590189512,
"learning_rate": 2.9415904115710964e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1964389532804489,
"step": 1770,
"valid_targets_mean": 4062.7,
"valid_targets_min": 1477
},
{
"epoch": 2.8768233387358184,
"grad_norm": 0.3731738506531456,
"learning_rate": 2.9344521877044633e-05,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1585400551557541,
"step": 1775,
"valid_targets_mean": 4726.6,
"valid_targets_min": 1585
},
{
"epoch": 2.884927066450567,
"grad_norm": 0.4165595181612634,
"learning_rate": 2.927298703393924e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13799604773521423,
"step": 1780,
"valid_targets_mean": 3671.0,
"valid_targets_min": 1361
},
{
"epoch": 2.893030794165316,
"grad_norm": 0.4273575398894236,
"learning_rate": 2.9201300754623046e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18003098666667938,
"step": 1785,
"valid_targets_mean": 4422.1,
"valid_targets_min": 882
},
{
"epoch": 2.901134521880065,
"grad_norm": 0.3639663217266001,
"learning_rate": 2.9129464209797404e-05,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.199708953499794,
"step": 1790,
"valid_targets_mean": 5779.1,
"valid_targets_min": 1363
},
{
"epoch": 2.9092382495948135,
"grad_norm": 0.3843377653988568,
"learning_rate": 2.9057478572617644e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15898755192756653,
"step": 1795,
"valid_targets_mean": 4513.2,
"valid_targets_min": 1493
},
{
"epoch": 2.9173419773095626,
"grad_norm": 0.41883027314954663,
"learning_rate": 2.898534501867391e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2081822007894516,
"step": 1800,
"valid_targets_mean": 4719.1,
"valid_targets_min": 1112
},
{
"epoch": 2.9254457050243112,
"grad_norm": 0.4313248963680573,
"learning_rate": 2.8913064725971947e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.176205113530159,
"step": 1805,
"valid_targets_mean": 4301.3,
"valid_targets_min": 1469
},
{
"epoch": 2.93354943273906,
"grad_norm": 0.3577726246588782,
"learning_rate": 2.8840638874913894e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21595324575901031,
"step": 1810,
"valid_targets_mean": 5801.4,
"valid_targets_min": 1025
},
{
"epoch": 2.941653160453809,
"grad_norm": 0.40431026504522666,
"learning_rate": 2.8768068648278976e-05,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15173974633216858,
"step": 1815,
"valid_targets_mean": 4143.2,
"valid_targets_min": 614
},
{
"epoch": 2.9497568881685576,
"grad_norm": 0.4056315860760992,
"learning_rate": 2.8695355231204206e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18253010511398315,
"step": 1820,
"valid_targets_mean": 4631.1,
"valid_targets_min": 1584
},
{
"epoch": 2.9578606158833063,
"grad_norm": 0.3605840500101974,
"learning_rate": 2.862249981116502e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17268909513950348,
"step": 1825,
"valid_targets_mean": 4815.9,
"valid_targets_min": 1465
},
{
"epoch": 2.965964343598055,
"grad_norm": 0.4393224667022168,
"learning_rate": 2.854950357795589e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1699746996164322,
"step": 1830,
"valid_targets_mean": 3549.6,
"valid_targets_min": 587
},
{
"epoch": 2.974068071312804,
"grad_norm": 0.4084908609658448,
"learning_rate": 2.847636772367091e-05,
"loss": 0.1899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18084849417209625,
"step": 1835,
"valid_targets_mean": 4688.5,
"valid_targets_min": 965
},
{
"epoch": 2.9821717990275527,
"grad_norm": 0.3904995138540871,
"learning_rate": 2.8403093442684287e-05,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17414742708206177,
"step": 1840,
"valid_targets_mean": 4738.1,
"valid_targets_min": 1333
},
{
"epoch": 2.9902755267423013,
"grad_norm": 0.3986330323947676,
"learning_rate": 2.8329681931630877e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1696147918701172,
"step": 1845,
"valid_targets_mean": 4719.2,
"valid_targets_min": 1508
},
{
"epoch": 2.99837925445705,
"grad_norm": 0.3738285751356821,
"learning_rate": 2.825613438938663e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16895028948783875,
"step": 1850,
"valid_targets_mean": 4317.1,
"valid_targets_min": 1512
},
{
"epoch": 3.006482982171799,
"grad_norm": 0.4458576556741155,
"learning_rate": 2.8182452017048983e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20063985884189606,
"step": 1855,
"valid_targets_mean": 3893.2,
"valid_targets_min": 1938
},
{
"epoch": 3.0145867098865478,
"grad_norm": 0.5437818382202464,
"learning_rate": 2.81086360179173e-05,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13127049803733826,
"step": 1860,
"valid_targets_mean": 3906.6,
"valid_targets_min": 1366
},
{
"epoch": 3.0226904376012964,
"grad_norm": 0.7414088618069266,
"learning_rate": 2.8034687597473164e-05,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14226055145263672,
"step": 1865,
"valid_targets_mean": 4408.1,
"valid_targets_min": 2015
},
{
"epoch": 3.0307941653160455,
"grad_norm": 0.3958731743842448,
"learning_rate": 2.796060796336074e-05,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14440515637397766,
"step": 1870,
"valid_targets_mean": 3883.9,
"valid_targets_min": 1145
},
{
"epoch": 3.038897893030794,
"grad_norm": 0.3863363231479288,
"learning_rate": 2.7886398325367018e-05,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1541876196861267,
"step": 1875,
"valid_targets_mean": 4888.3,
"valid_targets_min": 1409
},
{
"epoch": 3.047001620745543,
"grad_norm": 0.38862351941958634,
"learning_rate": 2.7812059895402064e-05,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17312254011631012,
"step": 1880,
"valid_targets_mean": 4551.8,
"valid_targets_min": 1201
},
{
"epoch": 3.055105348460292,
"grad_norm": 0.40110635229720293,
"learning_rate": 2.773759388747925e-05,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14018696546554565,
"step": 1885,
"valid_targets_mean": 4621.5,
"valid_targets_min": 1347
},
{
"epoch": 3.0632090761750406,
"grad_norm": 0.5140462329460982,
"learning_rate": 2.7663001517695386e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14781486988067627,
"step": 1890,
"valid_targets_mean": 4935.8,
"valid_targets_min": 2293
},
{
"epoch": 3.0713128038897892,
"grad_norm": 0.4632445118213682,
"learning_rate": 2.7588284004210907e-05,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17635850608348846,
"step": 1895,
"valid_targets_mean": 3667.7,
"valid_targets_min": 842
},
{
"epoch": 3.079416531604538,
"grad_norm": 0.4140405136032335,
"learning_rate": 2.7513442567229936e-05,
"loss": 0.162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16254425048828125,
"step": 1900,
"valid_targets_mean": 3994.1,
"valid_targets_min": 2484
},
{
"epoch": 3.087520259319287,
"grad_norm": 0.4340338509048081,
"learning_rate": 2.7438478428980407e-05,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1579328179359436,
"step": 1905,
"valid_targets_mean": 3750.8,
"valid_targets_min": 1366
},
{
"epoch": 3.0956239870340356,
"grad_norm": 0.45026657211719584,
"learning_rate": 2.7363392813694047e-05,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.178205206990242,
"step": 1910,
"valid_targets_mean": 3745.9,
"valid_targets_min": 1358
},
{
"epoch": 3.1037277147487843,
"grad_norm": 0.4337354223525519,
"learning_rate": 2.7288186947586426e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1774899810552597,
"step": 1915,
"valid_targets_mean": 4129.7,
"valid_targets_min": 999
},
{
"epoch": 3.1118314424635334,
"grad_norm": 0.42347076906338227,
"learning_rate": 2.7212862058836925e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14904651045799255,
"step": 1920,
"valid_targets_mean": 3875.8,
"valid_targets_min": 1281
},
{
"epoch": 3.119935170178282,
"grad_norm": 0.405451275894032,
"learning_rate": 2.713741937756865e-05,
"loss": 0.1562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13380369544029236,
"step": 1925,
"valid_targets_mean": 3421.6,
"valid_targets_min": 676
},
{
"epoch": 3.1280388978930307,
"grad_norm": 0.3967232066747482,
"learning_rate": 2.7061860135828384e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1519922912120819,
"step": 1930,
"valid_targets_mean": 4485.6,
"valid_targets_min": 1366
},
{
"epoch": 3.1361426256077793,
"grad_norm": 0.39244088979289066,
"learning_rate": 2.6986185567566442e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16591840982437134,
"step": 1935,
"valid_targets_mean": 5006.6,
"valid_targets_min": 1399
},
{
"epoch": 3.1442463533225284,
"grad_norm": 0.45152809145456724,
"learning_rate": 2.6910396908616527e-05,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18249057233333588,
"step": 1940,
"valid_targets_mean": 4102.7,
"valid_targets_min": 1358
},
{
"epoch": 3.152350081037277,
"grad_norm": 0.3925517166211551,
"learning_rate": 2.6834495396675526e-05,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1807394027709961,
"step": 1945,
"valid_targets_mean": 5163.2,
"valid_targets_min": 2123
},
{
"epoch": 3.1604538087520258,
"grad_norm": 0.37615773969729294,
"learning_rate": 2.6758482271283347e-05,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15303456783294678,
"step": 1950,
"valid_targets_mean": 4954.9,
"valid_targets_min": 1379
},
{
"epoch": 3.168557536466775,
"grad_norm": 0.3825435765582147,
"learning_rate": 2.668235877380263e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14769810438156128,
"step": 1955,
"valid_targets_mean": 4466.6,
"valid_targets_min": 1899
},
{
"epoch": 3.1766612641815235,
"grad_norm": 0.5029144947784785,
"learning_rate": 2.660612614739849e-05,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18598952889442444,
"step": 1960,
"valid_targets_mean": 3101.1,
"valid_targets_min": 844
},
{
"epoch": 3.184764991896272,
"grad_norm": 0.3831787296377238,
"learning_rate": 2.652978563701822e-05,
"loss": 0.1491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1297546774148941,
"step": 1965,
"valid_targets_mean": 4340.1,
"valid_targets_min": 1250
},
{
"epoch": 3.1928687196110213,
"grad_norm": 0.4144693596376343,
"learning_rate": 2.645333848937095e-05,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14467677474021912,
"step": 1970,
"valid_targets_mean": 3855.9,
"valid_targets_min": 1517
},
{
"epoch": 3.20097244732577,
"grad_norm": 0.42457591777397313,
"learning_rate": 2.6376785952907292e-05,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1861054003238678,
"step": 1975,
"valid_targets_mean": 4458.5,
"valid_targets_min": 1381
},
{
"epoch": 3.2090761750405186,
"grad_norm": 0.39434289936014905,
"learning_rate": 2.630012927779896e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16375955939292908,
"step": 1980,
"valid_targets_mean": 4505.0,
"valid_targets_min": 1465
},
{
"epoch": 3.217179902755267,
"grad_norm": 0.4022197268623526,
"learning_rate": 2.6223369715918338e-05,
"loss": 0.1785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17773842811584473,
"step": 1985,
"valid_targets_mean": 5042.1,
"valid_targets_min": 2203
},
{
"epoch": 3.2252836304700163,
"grad_norm": 0.42080806470642895,
"learning_rate": 2.614650852081805e-05,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16340884566307068,
"step": 1990,
"valid_targets_mean": 4147.1,
"valid_targets_min": 1395
},
{
"epoch": 3.233387358184765,
"grad_norm": 0.39877594715149084,
"learning_rate": 2.606954694771047e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19070208072662354,
"step": 1995,
"valid_targets_mean": 5167.7,
"valid_targets_min": 2503
},
{
"epoch": 3.2414910858995136,
"grad_norm": 0.4170345486796608,
"learning_rate": 2.5992486253447258e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16822439432144165,
"step": 2000,
"valid_targets_mean": 4404.3,
"valid_targets_min": 1622
},
{
"epoch": 3.2495948136142627,
"grad_norm": 0.3891233710055621,
"learning_rate": 2.5915327696498787e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17434442043304443,
"step": 2005,
"valid_targets_mean": 5199.5,
"valid_targets_min": 932
},
{
"epoch": 3.2576985413290114,
"grad_norm": 0.34701884376339476,
"learning_rate": 2.583807253693362e-05,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1562272012233734,
"step": 2010,
"valid_targets_mean": 5518.5,
"valid_targets_min": 848
},
{
"epoch": 3.26580226904376,
"grad_norm": 0.41218355325803036,
"learning_rate": 2.576072203639794e-05,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15922808647155762,
"step": 2015,
"valid_targets_mean": 4113.3,
"valid_targets_min": 1485
},
{
"epoch": 3.2739059967585087,
"grad_norm": 0.4109547934633965,
"learning_rate": 2.5683277458094926e-05,
"loss": 0.1676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16199171543121338,
"step": 2020,
"valid_targets_mean": 4417.1,
"valid_targets_min": 1268
},
{
"epoch": 3.282009724473258,
"grad_norm": 0.3744324756824404,
"learning_rate": 2.560574006676413e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1650342345237732,
"step": 2025,
"valid_targets_mean": 5119.9,
"valid_targets_min": 1402
},
{
"epoch": 3.2901134521880064,
"grad_norm": 0.3996207068608718,
"learning_rate": 2.5528111128660826e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18693450093269348,
"step": 2030,
"valid_targets_mean": 5332.9,
"valid_targets_min": 1422
},
{
"epoch": 3.298217179902755,
"grad_norm": 0.3949609988006854,
"learning_rate": 2.545039191153533e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1728595793247223,
"step": 2035,
"valid_targets_mean": 4955.7,
"valid_targets_min": 1467
},
{
"epoch": 3.306320907617504,
"grad_norm": 0.4139286573888577,
"learning_rate": 2.53725836846123e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1731775999069214,
"step": 2040,
"valid_targets_mean": 4870.6,
"valid_targets_min": 2364
},
{
"epoch": 3.314424635332253,
"grad_norm": 0.39980850038411364,
"learning_rate": 2.5294687718569994e-05,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17138364911079407,
"step": 2045,
"valid_targets_mean": 4727.1,
"valid_targets_min": 1195
},
{
"epoch": 3.3225283630470015,
"grad_norm": 0.4296995400998342,
"learning_rate": 2.5216705285519525e-05,
"loss": 0.147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14280448853969574,
"step": 2050,
"valid_targets_mean": 3781.5,
"valid_targets_min": 1393
},
{
"epoch": 3.3306320907617506,
"grad_norm": 0.3962285375649505,
"learning_rate": 2.5138637658984116e-05,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1752699315547943,
"step": 2055,
"valid_targets_mean": 4631.1,
"valid_targets_min": 595
},
{
"epoch": 3.3387358184764993,
"grad_norm": 0.4211633580398836,
"learning_rate": 2.5060486113878244e-05,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16262900829315186,
"step": 2060,
"valid_targets_mean": 4000.8,
"valid_targets_min": 1298
},
{
"epoch": 3.346839546191248,
"grad_norm": 0.3968558871252429,
"learning_rate": 2.4982251926486873e-05,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1583396941423416,
"step": 2065,
"valid_targets_mean": 4512.4,
"valid_targets_min": 1316
},
{
"epoch": 3.354943273905997,
"grad_norm": 0.41675904818776327,
"learning_rate": 2.490393637444458e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1787576675415039,
"step": 2070,
"valid_targets_mean": 5438.1,
"valid_targets_min": 1668
},
{
"epoch": 3.3630470016207457,
"grad_norm": 0.3822854208050519,
"learning_rate": 2.482554073671471e-05,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1810203194618225,
"step": 2075,
"valid_targets_mean": 4925.5,
"valid_targets_min": 641
},
{
"epoch": 3.3711507293354943,
"grad_norm": 0.3746793390777653,
"learning_rate": 2.4747066293568452e-05,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1479102522134781,
"step": 2080,
"valid_targets_mean": 4342.9,
"valid_targets_min": 1357
},
{
"epoch": 3.379254457050243,
"grad_norm": 0.4169494009407781,
"learning_rate": 2.4668514326564e-05,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17268824577331543,
"step": 2085,
"valid_targets_mean": 4090.0,
"valid_targets_min": 1306
},
{
"epoch": 3.387358184764992,
"grad_norm": 0.42376297596655554,
"learning_rate": 2.4589886118525556e-05,
"loss": 0.1579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13542214035987854,
"step": 2090,
"valid_targets_mean": 3641.6,
"valid_targets_min": 1265
},
{
"epoch": 3.3954619124797407,
"grad_norm": 0.35964018388907254,
"learning_rate": 2.4511182953522405e-05,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18550920486450195,
"step": 2095,
"valid_targets_mean": 6288.9,
"valid_targets_min": 2357
},
{
"epoch": 3.4035656401944894,
"grad_norm": 0.420468377931095,
"learning_rate": 2.4432406116847954e-05,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15402904152870178,
"step": 2100,
"valid_targets_mean": 3651.9,
"valid_targets_min": 1443
},
{
"epoch": 3.411669367909238,
"grad_norm": 0.3480070041971189,
"learning_rate": 2.435355689499874e-05,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15732459723949432,
"step": 2105,
"valid_targets_mean": 5594.8,
"valid_targets_min": 1491
},
{
"epoch": 3.419773095623987,
"grad_norm": 0.43677187908434917,
"learning_rate": 2.4274636575653398e-05,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1524367332458496,
"step": 2110,
"valid_targets_mean": 4121.1,
"valid_targets_min": 1403
},
{
"epoch": 3.427876823338736,
"grad_norm": 0.39059587976025334,
"learning_rate": 2.4195646447651663e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16522473096847534,
"step": 2115,
"valid_targets_mean": 5062.4,
"valid_targets_min": 944
},
{
"epoch": 3.4359805510534844,
"grad_norm": 0.3852515258101976,
"learning_rate": 2.411658780097331e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1708238273859024,
"step": 2120,
"valid_targets_mean": 5137.6,
"valid_targets_min": 1333
},
{
"epoch": 3.4440842787682335,
"grad_norm": 0.389032518997545,
"learning_rate": 2.4037461926717075e-05,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17317542433738708,
"step": 2125,
"valid_targets_mean": 4953.7,
"valid_targets_min": 738
},
{
"epoch": 3.452188006482982,
"grad_norm": 0.4147483170037612,
"learning_rate": 2.395827011707959e-05,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16804209351539612,
"step": 2130,
"valid_targets_mean": 4543.6,
"valid_targets_min": 1407
},
{
"epoch": 3.460291734197731,
"grad_norm": 0.4360946325373845,
"learning_rate": 2.3879013665334258e-05,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1393245905637741,
"step": 2135,
"valid_targets_mean": 3851.3,
"valid_targets_min": 1041
},
{
"epoch": 3.46839546191248,
"grad_norm": 0.35655609281423195,
"learning_rate": 2.3799693865810163e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14911235868930817,
"step": 2140,
"valid_targets_mean": 5114.5,
"valid_targets_min": 2426
},
{
"epoch": 3.4764991896272286,
"grad_norm": 0.45634252157298655,
"learning_rate": 2.37203120138709e-05,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24309851229190826,
"step": 2145,
"valid_targets_mean": 4436.9,
"valid_targets_min": 1453
},
{
"epoch": 3.4846029173419772,
"grad_norm": 0.42263469645641794,
"learning_rate": 2.3640869405893446e-05,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1451752930879593,
"step": 2150,
"valid_targets_mean": 4446.0,
"valid_targets_min": 1438
},
{
"epoch": 3.492706645056726,
"grad_norm": 0.39906455734326574,
"learning_rate": 2.3561367339246976e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18286089599132538,
"step": 2155,
"valid_targets_mean": 5142.6,
"valid_targets_min": 1423
},
{
"epoch": 3.500810372771475,
"grad_norm": 0.418866166123448,
"learning_rate": 2.3481807112271678e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18328286707401276,
"step": 2160,
"valid_targets_mean": 4042.1,
"valid_targets_min": 1430
},
{
"epoch": 3.5089141004862237,
"grad_norm": 0.4014900167402139,
"learning_rate": 2.3402190024257543e-05,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15818876028060913,
"step": 2165,
"valid_targets_mean": 3847.3,
"valid_targets_min": 1412
},
{
"epoch": 3.5170178282009723,
"grad_norm": 0.36321998289056967,
"learning_rate": 2.3322517375423165e-05,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13905078172683716,
"step": 2170,
"valid_targets_mean": 4851.6,
"valid_targets_min": 1478
},
{
"epoch": 3.525121555915721,
"grad_norm": 0.4175559746072245,
"learning_rate": 2.3242790466894494e-05,
"loss": 0.1843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2257763147354126,
"step": 2175,
"valid_targets_mean": 5145.1,
"valid_targets_min": 1324
},
{
"epoch": 3.53322528363047,
"grad_norm": 0.3721262066889466,
"learning_rate": 2.316301060068359e-05,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15761905908584595,
"step": 2180,
"valid_targets_mean": 4843.8,
"valid_targets_min": 2620
},
{
"epoch": 3.5413290113452187,
"grad_norm": 0.4012053491625949,
"learning_rate": 2.3083179079667347e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15592560172080994,
"step": 2185,
"valid_targets_mean": 4353.8,
"valid_targets_min": 1432
},
{
"epoch": 3.5494327390599674,
"grad_norm": 0.4375921159428318,
"learning_rate": 2.300329720756625e-05,
"loss": 0.1875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1943226456642151,
"step": 2190,
"valid_targets_mean": 4139.7,
"valid_targets_min": 1361
},
{
"epoch": 3.5575364667747165,
"grad_norm": 0.40049465719853394,
"learning_rate": 2.2923366288923045e-05,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14853128790855408,
"step": 2195,
"valid_targets_mean": 4349.8,
"valid_targets_min": 1489
},
{
"epoch": 3.565640194489465,
"grad_norm": 0.3931973901766357,
"learning_rate": 2.2843387629081453e-05,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2016703337430954,
"step": 2200,
"valid_targets_mean": 5098.6,
"valid_targets_min": 2065
},
{
"epoch": 3.5737439222042138,
"grad_norm": 0.4690674312594426,
"learning_rate": 2.2763362534164854e-05,
"loss": 0.1762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14409610629081726,
"step": 2205,
"valid_targets_mean": 4489.2,
"valid_targets_min": 1316
},
{
"epoch": 3.581847649918963,
"grad_norm": 0.3623772576301561,
"learning_rate": 2.268329231105498e-05,
"loss": 0.1712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1700354665517807,
"step": 2210,
"valid_targets_mean": 5424.8,
"valid_targets_min": 1409
},
{
"epoch": 3.5899513776337115,
"grad_norm": 0.39514612685466244,
"learning_rate": 2.2603178267370504e-05,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2017160952091217,
"step": 2215,
"valid_targets_mean": 5409.3,
"valid_targets_min": 1364
},
{
"epoch": 3.59805510534846,
"grad_norm": 0.384040585215328,
"learning_rate": 2.2523021711445746e-05,
"loss": 0.1696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17937374114990234,
"step": 2220,
"valid_targets_mean": 4387.1,
"valid_targets_min": 1391
},
{
"epoch": 3.6061588330632093,
"grad_norm": 0.3998607141504835,
"learning_rate": 2.2442823952309308e-05,
"loss": 0.183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16963882744312286,
"step": 2225,
"valid_targets_mean": 4776.0,
"valid_targets_min": 1444
},
{
"epoch": 3.614262560777958,
"grad_norm": 0.3659718411449704,
"learning_rate": 2.2362586299662642e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1675758808851242,
"step": 2230,
"valid_targets_mean": 5171.9,
"valid_targets_min": 1385
},
{
"epoch": 3.6223662884927066,
"grad_norm": 0.3723845904154494,
"learning_rate": 2.228231006385873e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19093650579452515,
"step": 2235,
"valid_targets_mean": 5510.3,
"valid_targets_min": 1457
},
{
"epoch": 3.6304700162074557,
"grad_norm": 0.3889362488963387,
"learning_rate": 2.2201996555880633e-05,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14821797609329224,
"step": 2240,
"valid_targets_mean": 4622.1,
"valid_targets_min": 1273
},
{
"epoch": 3.6385737439222043,
"grad_norm": 0.4083309341620573,
"learning_rate": 2.2121647087320105e-05,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16050675511360168,
"step": 2245,
"valid_targets_mean": 4249.2,
"valid_targets_min": 1355
},
{
"epoch": 3.646677471636953,
"grad_norm": 0.40763578479365914,
"learning_rate": 2.204126297035617e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16511400043964386,
"step": 2250,
"valid_targets_mean": 4262.1,
"valid_targets_min": 1390
},
{
"epoch": 3.6547811993517016,
"grad_norm": 0.4033094775868518,
"learning_rate": 2.196084551773368e-05,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18204748630523682,
"step": 2255,
"valid_targets_mean": 4871.3,
"valid_targets_min": 1654
},
{
"epoch": 3.6628849270664503,
"grad_norm": 0.37714115301157575,
"learning_rate": 2.1880396042741906e-05,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16021430492401123,
"step": 2260,
"valid_targets_mean": 4672.0,
"valid_targets_min": 1361
},
{
"epoch": 3.6709886547811994,
"grad_norm": 0.3923717006496399,
"learning_rate": 2.179991585919307e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15458917617797852,
"step": 2265,
"valid_targets_mean": 4315.2,
"valid_targets_min": 1298
},
{
"epoch": 3.679092382495948,
"grad_norm": 0.4429131605887363,
"learning_rate": 2.1719406281400873e-05,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15454357862472534,
"step": 2270,
"valid_targets_mean": 3315.8,
"valid_targets_min": 845
},
{
"epoch": 3.6871961102106967,
"grad_norm": 0.3727256205850918,
"learning_rate": 2.163886862415908e-05,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19542384147644043,
"step": 2275,
"valid_targets_mean": 5506.1,
"valid_targets_min": 1856
},
{
"epoch": 3.695299837925446,
"grad_norm": 0.41872269455653544,
"learning_rate": 2.155830420272e-05,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1771114021539688,
"step": 2280,
"valid_targets_mean": 4206.1,
"valid_targets_min": 914
},
{
"epoch": 3.7034035656401945,
"grad_norm": 0.38039050268682023,
"learning_rate": 2.1477714332773022e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15340042114257812,
"step": 2285,
"valid_targets_mean": 4411.3,
"valid_targets_min": 1327
},
{
"epoch": 3.711507293354943,
"grad_norm": 0.38361661527060936,
"learning_rate": 2.139710033042314e-05,
"loss": 0.1551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14032137393951416,
"step": 2290,
"valid_targets_mean": 4275.1,
"valid_targets_min": 1308
},
{
"epoch": 3.719611021069692,
"grad_norm": 0.37278829695234467,
"learning_rate": 2.1316463512169453e-05,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17240861058235168,
"step": 2295,
"valid_targets_mean": 5224.4,
"valid_targets_min": 2093
},
{
"epoch": 3.727714748784441,
"grad_norm": 0.41452369103684505,
"learning_rate": 2.1235805194883665e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15849941968917847,
"step": 2300,
"valid_targets_mean": 4130.9,
"valid_targets_min": 709
},
{
"epoch": 3.7358184764991895,
"grad_norm": 0.4105117214988862,
"learning_rate": 2.115512669578857e-05,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17380082607269287,
"step": 2305,
"valid_targets_mean": 4336.1,
"valid_targets_min": 1375
},
{
"epoch": 3.7439222042139386,
"grad_norm": 0.40472321885140583,
"learning_rate": 2.107442933243656e-05,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15123385190963745,
"step": 2310,
"valid_targets_mean": 3974.2,
"valid_targets_min": 987
},
{
"epoch": 3.7520259319286873,
"grad_norm": 0.39922382065316403,
"learning_rate": 2.099371442268809e-05,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1767762154340744,
"step": 2315,
"valid_targets_mean": 5035.8,
"valid_targets_min": 1275
},
{
"epoch": 3.760129659643436,
"grad_norm": 0.40427130510941617,
"learning_rate": 2.0912983284690157e-05,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16852274537086487,
"step": 2320,
"valid_targets_mean": 4461.9,
"valid_targets_min": 1182
},
{
"epoch": 3.768233387358185,
"grad_norm": 0.36533036313023187,
"learning_rate": 2.0832237236854794e-05,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1574646532535553,
"step": 2325,
"valid_targets_mean": 5237.7,
"valid_targets_min": 2002
},
{
"epoch": 3.7763371150729337,
"grad_norm": 0.4491625565997479,
"learning_rate": 2.0751477597837528e-05,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15878888964653015,
"step": 2330,
"valid_targets_mean": 3329.7,
"valid_targets_min": 1413
},
{
"epoch": 3.7844408427876823,
"grad_norm": 0.42508704076737175,
"learning_rate": 2.0670705686515822e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17809738218784332,
"step": 2335,
"valid_targets_mean": 4440.5,
"valid_targets_min": 1481
},
{
"epoch": 3.792544570502431,
"grad_norm": 0.368677101634329,
"learning_rate": 2.0589922821967566e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14476372301578522,
"step": 2340,
"valid_targets_mean": 4738.7,
"valid_targets_min": 2581
},
{
"epoch": 3.8006482982171796,
"grad_norm": 0.3513444622347881,
"learning_rate": 2.0509130323449545e-05,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14614984393119812,
"step": 2345,
"valid_targets_mean": 5030.6,
"valid_targets_min": 1391
},
{
"epoch": 3.8087520259319287,
"grad_norm": 0.38888200892854763,
"learning_rate": 2.0428329510375838e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18158888816833496,
"step": 2350,
"valid_targets_mean": 5079.9,
"valid_targets_min": 658
},
{
"epoch": 3.8168557536466774,
"grad_norm": 0.39272999735098785,
"learning_rate": 2.0347521702296333e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17020182311534882,
"step": 2355,
"valid_targets_mean": 4373.2,
"valid_targets_min": 1442
},
{
"epoch": 3.824959481361426,
"grad_norm": 0.4232818574011928,
"learning_rate": 2.026670821887516e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16656385362148285,
"step": 2360,
"valid_targets_mean": 3902.8,
"valid_targets_min": 1268
},
{
"epoch": 3.833063209076175,
"grad_norm": 0.41216984193887707,
"learning_rate": 2.0185890379869115e-05,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17816784977912903,
"step": 2365,
"valid_targets_mean": 4348.3,
"valid_targets_min": 1358
},
{
"epoch": 3.841166936790924,
"grad_norm": 0.44398530330040875,
"learning_rate": 2.0105069505106126e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19711148738861084,
"step": 2370,
"valid_targets_mean": 3858.1,
"valid_targets_min": 953
},
{
"epoch": 3.8492706645056725,
"grad_norm": 0.4232380513339039,
"learning_rate": 2.00242469144637e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20543363690376282,
"step": 2375,
"valid_targets_mean": 4407.2,
"valid_targets_min": 965
},
{
"epoch": 3.8573743922204216,
"grad_norm": 0.3900183593026856,
"learning_rate": 1.994342392784738e-05,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16155295073986053,
"step": 2380,
"valid_targets_mean": 5209.2,
"valid_targets_min": 1626
},
{
"epoch": 3.86547811993517,
"grad_norm": 0.4382394230770189,
"learning_rate": 1.9862601865169154e-05,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19150716066360474,
"step": 2385,
"valid_targets_mean": 4058.0,
"valid_targets_min": 2171
},
{
"epoch": 3.873581847649919,
"grad_norm": 0.3915766944447351,
"learning_rate": 1.9781782046325938e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20614922046661377,
"step": 2390,
"valid_targets_mean": 5446.2,
"valid_targets_min": 2126
},
{
"epoch": 3.881685575364668,
"grad_norm": 0.412179929960335,
"learning_rate": 1.9700965791177986e-05,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1477297991514206,
"step": 2395,
"valid_targets_mean": 3787.9,
"valid_targets_min": 613
},
{
"epoch": 3.8897893030794166,
"grad_norm": 0.3690789892884091,
"learning_rate": 1.9620154419527372e-05,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15172114968299866,
"step": 2400,
"valid_targets_mean": 4618.4,
"valid_targets_min": 1325
},
{
"epoch": 3.8978930307941653,
"grad_norm": 0.37676014543592173,
"learning_rate": 1.953934925109641e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1793600618839264,
"step": 2405,
"valid_targets_mean": 6207.1,
"valid_targets_min": 1376
},
{
"epoch": 3.9059967585089144,
"grad_norm": 0.376452620738995,
"learning_rate": 1.945855160550611e-05,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1523461639881134,
"step": 2410,
"valid_targets_mean": 4525.1,
"valid_targets_min": 1362
},
{
"epoch": 3.914100486223663,
"grad_norm": 0.4485198814325497,
"learning_rate": 1.937776280225463e-05,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19850586354732513,
"step": 2415,
"valid_targets_mean": 4109.6,
"valid_targets_min": 1346
},
{
"epoch": 3.9222042139384117,
"grad_norm": 0.36670050740221194,
"learning_rate": 1.929698416069571e-05,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12801700830459595,
"step": 2420,
"valid_targets_mean": 4113.8,
"valid_targets_min": 1500
},
{
"epoch": 3.9303079416531603,
"grad_norm": 0.4351692157835089,
"learning_rate": 1.9216217000017182e-05,
"loss": 0.1633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1605074107646942,
"step": 2425,
"valid_targets_mean": 4056.4,
"valid_targets_min": 931
},
{
"epoch": 3.938411669367909,
"grad_norm": 0.36574619747694626,
"learning_rate": 1.9135462639219325e-05,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1689274162054062,
"step": 2430,
"valid_targets_mean": 5585.9,
"valid_targets_min": 1432
},
{
"epoch": 3.946515397082658,
"grad_norm": 0.38191010503407485,
"learning_rate": 1.905472239709343e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17569342255592346,
"step": 2435,
"valid_targets_mean": 5288.8,
"valid_targets_min": 1293
},
{
"epoch": 3.9546191247974067,
"grad_norm": 0.43597968410963234,
"learning_rate": 1.89739975922002e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1510361284017563,
"step": 2440,
"valid_targets_mean": 3357.4,
"valid_targets_min": 1437
},
{
"epoch": 3.9627228525121554,
"grad_norm": 0.4065088260858607,
"learning_rate": 1.889328954284823e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20322582125663757,
"step": 2445,
"valid_targets_mean": 5177.2,
"valid_targets_min": 1809
},
{
"epoch": 3.9708265802269045,
"grad_norm": 0.40878374932726397,
"learning_rate": 1.8812599567072496e-05,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16112422943115234,
"step": 2450,
"valid_targets_mean": 4005.9,
"valid_targets_min": 1297
},
{
"epoch": 3.978930307941653,
"grad_norm": 0.38156401896539294,
"learning_rate": 1.873192898261281e-05,
"loss": 0.1675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13983334600925446,
"step": 2455,
"valid_targets_mean": 4194.0,
"valid_targets_min": 1475
},
{
"epoch": 3.987034035656402,
"grad_norm": 0.3457409189940038,
"learning_rate": 1.8651279106892317e-05,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15533336997032166,
"step": 2460,
"valid_targets_mean": 5028.2,
"valid_targets_min": 1352
},
{
"epoch": 3.995137763371151,
"grad_norm": 0.39600319716364357,
"learning_rate": 1.8570651256995933e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16132251918315887,
"step": 2465,
"valid_targets_mean": 4323.6,
"valid_targets_min": 808
},
{
"epoch": 4.003241491085899,
"grad_norm": 0.3712874056679798,
"learning_rate": 1.849004674964891e-05,
"loss": 0.1685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1383274495601654,
"step": 2470,
"valid_targets_mean": 4591.7,
"valid_targets_min": 2381
},
{
"epoch": 4.011345218800648,
"grad_norm": 0.4067132658580004,
"learning_rate": 1.840946690119528e-05,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15070272982120514,
"step": 2475,
"valid_targets_mean": 4897.0,
"valid_targets_min": 1838
},
{
"epoch": 4.019448946515397,
"grad_norm": 0.40042514051100025,
"learning_rate": 1.8328913027576373e-05,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17309023439884186,
"step": 2480,
"valid_targets_mean": 5681.7,
"valid_targets_min": 1563
},
{
"epoch": 4.0275526742301455,
"grad_norm": 0.4256429505889172,
"learning_rate": 1.824838644430934e-05,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19765028357505798,
"step": 2485,
"valid_targets_mean": 4691.1,
"valid_targets_min": 1464
},
{
"epoch": 4.035656401944895,
"grad_norm": 0.4186562721256565,
"learning_rate": 1.8167888466465652e-05,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1643456518650055,
"step": 2490,
"valid_targets_mean": 4467.4,
"valid_targets_min": 1361
},
{
"epoch": 4.043760129659644,
"grad_norm": 0.429059584351004,
"learning_rate": 1.8087420408649596e-05,
"loss": 0.159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18240870535373688,
"step": 2495,
"valid_targets_mean": 4909.3,
"valid_targets_min": 1389
},
{
"epoch": 4.051863857374392,
"grad_norm": 0.3780733056271099,
"learning_rate": 1.8006983584976877e-05,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14605969190597534,
"step": 2500,
"valid_targets_mean": 4654.2,
"valid_targets_min": 1355
},
{
"epoch": 4.059967585089141,
"grad_norm": 0.3846916169230815,
"learning_rate": 1.7926579309053098e-05,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16894376277923584,
"step": 2505,
"valid_targets_mean": 4829.9,
"valid_targets_min": 658
},
{
"epoch": 4.06807131280389,
"grad_norm": 0.4228920289359892,
"learning_rate": 1.7846208893952346e-05,
"loss": 0.1466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1531849503517151,
"step": 2510,
"valid_targets_mean": 4364.9,
"valid_targets_min": 1195
},
{
"epoch": 4.076175040518638,
"grad_norm": 0.37417154963610766,
"learning_rate": 1.7765873652195713e-05,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16471320390701294,
"step": 2515,
"valid_targets_mean": 5711.6,
"valid_targets_min": 2235
},
{
"epoch": 4.084278768233387,
"grad_norm": 0.41101129071151,
"learning_rate": 1.7685574895729886e-05,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15926535427570343,
"step": 2520,
"valid_targets_mean": 4601.2,
"valid_targets_min": 578
},
{
"epoch": 4.0923824959481365,
"grad_norm": 0.37464269508058695,
"learning_rate": 1.7605313935905722e-05,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16744540631771088,
"step": 2525,
"valid_targets_mean": 5294.9,
"valid_targets_min": 1516
},
{
"epoch": 4.100486223662885,
"grad_norm": 0.39631540471893606,
"learning_rate": 1.7525092083456795e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17988884449005127,
"step": 2530,
"valid_targets_mean": 5167.6,
"valid_targets_min": 1413
},
{
"epoch": 4.108589951377634,
"grad_norm": 0.3970097082477904,
"learning_rate": 1.744491064847805e-05,
"loss": 0.1649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14189140498638153,
"step": 2535,
"valid_targets_mean": 4496.8,
"valid_targets_min": 1527
},
{
"epoch": 4.116693679092383,
"grad_norm": 0.4092664053834939,
"learning_rate": 1.7364770940404375e-05,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12488947808742523,
"step": 2540,
"valid_targets_mean": 3773.7,
"valid_targets_min": 1358
},
{
"epoch": 4.124797406807131,
"grad_norm": 0.4108401889537438,
"learning_rate": 1.7284674267989213e-05,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1261243373155594,
"step": 2545,
"valid_targets_mean": 3507.6,
"valid_targets_min": 300
},
{
"epoch": 4.13290113452188,
"grad_norm": 0.42068807609354025,
"learning_rate": 1.72046219392832e-05,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15615776181221008,
"step": 2550,
"valid_targets_mean": 4401.0,
"valid_targets_min": 2435
},
{
"epoch": 4.1410048622366284,
"grad_norm": 0.4504609491464449,
"learning_rate": 1.712461526161279e-05,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1747884750366211,
"step": 2555,
"valid_targets_mean": 4031.8,
"valid_targets_min": 688
},
{
"epoch": 4.1491085899513775,
"grad_norm": 0.5275595272741159,
"learning_rate": 1.7044655541558934e-05,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14213520288467407,
"step": 2560,
"valid_targets_mean": 2747.8,
"valid_targets_min": 931
},
{
"epoch": 4.157212317666127,
"grad_norm": 0.4071729089384716,
"learning_rate": 1.69647440849357e-05,
"loss": 0.1706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16947373747825623,
"step": 2565,
"valid_targets_mean": 4519.0,
"valid_targets_min": 1346
},
{
"epoch": 4.165316045380875,
"grad_norm": 0.3737831947406853,
"learning_rate": 1.6884882196768985e-05,
"loss": 0.1471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13542313873767853,
"step": 2570,
"valid_targets_mean": 4573.9,
"valid_targets_min": 1316
},
{
"epoch": 4.173419773095624,
"grad_norm": 0.39623962224896625,
"learning_rate": 1.680507118127518e-05,
"loss": 0.1629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1541873961687088,
"step": 2575,
"valid_targets_mean": 4521.7,
"valid_targets_min": 1449
},
{
"epoch": 4.181523500810373,
"grad_norm": 0.4031184428238581,
"learning_rate": 1.6725312341839895e-05,
"loss": 0.1808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18571238219738007,
"step": 2580,
"valid_targets_mean": 5134.5,
"valid_targets_min": 1309
},
{
"epoch": 4.189627228525121,
"grad_norm": 0.4361781205053545,
"learning_rate": 1.664560698099664e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17057061195373535,
"step": 2585,
"valid_targets_mean": 4028.2,
"valid_targets_min": 1416
},
{
"epoch": 4.19773095623987,
"grad_norm": 0.4433460811120863,
"learning_rate": 1.6565956400405586e-05,
"loss": 0.1672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1968003511428833,
"step": 2590,
"valid_targets_mean": 4815.5,
"valid_targets_min": 1462
},
{
"epoch": 4.2058346839546195,
"grad_norm": 0.4117119339099135,
"learning_rate": 1.6486361900832284e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15136125683784485,
"step": 2595,
"valid_targets_mean": 4527.9,
"valid_targets_min": 1020
},
{
"epoch": 4.213938411669368,
"grad_norm": 0.36532371602338826,
"learning_rate": 1.6406824782126428e-05,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16010749340057373,
"step": 2600,
"valid_targets_mean": 6099.1,
"valid_targets_min": 1379
},
{
"epoch": 4.222042139384117,
"grad_norm": 0.39087983526982967,
"learning_rate": 1.632734634320064e-05,
"loss": 0.1367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12246764451265335,
"step": 2605,
"valid_targets_mean": 4464.7,
"valid_targets_min": 2176
},
{
"epoch": 4.230145867098866,
"grad_norm": 0.4272797365502613,
"learning_rate": 1.6247927882009256e-05,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14960479736328125,
"step": 2610,
"valid_targets_mean": 4127.4,
"valid_targets_min": 1343
},
{
"epoch": 4.238249594813614,
"grad_norm": 0.462725135810111,
"learning_rate": 1.6168570695527096e-05,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14427827298641205,
"step": 2615,
"valid_targets_mean": 3540.2,
"valid_targets_min": 1187
},
{
"epoch": 4.246353322528363,
"grad_norm": 0.36206227558488485,
"learning_rate": 1.6089276079728334e-05,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1214427500963211,
"step": 2620,
"valid_targets_mean": 4497.8,
"valid_targets_min": 1410
},
{
"epoch": 4.254457050243111,
"grad_norm": 0.40276086433073494,
"learning_rate": 1.6010045329565294e-05,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13030347228050232,
"step": 2625,
"valid_targets_mean": 3962.0,
"valid_targets_min": 1434
},
{
"epoch": 4.2625607779578605,
"grad_norm": 0.4387160089339799,
"learning_rate": 1.5930879738947328e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14297866821289062,
"step": 2630,
"valid_targets_mean": 3749.6,
"valid_targets_min": 1432
},
{
"epoch": 4.27066450567261,
"grad_norm": 0.372668862412784,
"learning_rate": 1.585178060071966e-05,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14359818398952484,
"step": 2635,
"valid_targets_mean": 5299.0,
"valid_targets_min": 1386
},
{
"epoch": 4.278768233387358,
"grad_norm": 0.4146704722785337,
"learning_rate": 1.5772749206642296e-05,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1508176326751709,
"step": 2640,
"valid_targets_mean": 4494.6,
"valid_targets_min": 2469
},
{
"epoch": 4.286871961102107,
"grad_norm": 0.4054725189068471,
"learning_rate": 1.5693786847368918e-05,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13715773820877075,
"step": 2645,
"valid_targets_mean": 5204.2,
"valid_targets_min": 2589
},
{
"epoch": 4.294975688816856,
"grad_norm": 0.39034530846194615,
"learning_rate": 1.5614894812425806e-05,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12854069471359253,
"step": 2650,
"valid_targets_mean": 4378.7,
"valid_targets_min": 1333
},
{
"epoch": 4.303079416531604,
"grad_norm": 0.36953410992638486,
"learning_rate": 1.5536074390190786e-05,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1475868672132492,
"step": 2655,
"valid_targets_mean": 5126.3,
"valid_targets_min": 1363
},
{
"epoch": 4.311183144246353,
"grad_norm": 0.4138943659186782,
"learning_rate": 1.5457326867872177e-05,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13638821244239807,
"step": 2660,
"valid_targets_mean": 4109.2,
"valid_targets_min": 1395
},
{
"epoch": 4.319286871961102,
"grad_norm": 0.34666953149423,
"learning_rate": 1.5378653531487784e-05,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1447892189025879,
"step": 2665,
"valid_targets_mean": 6002.4,
"valid_targets_min": 1608
},
{
"epoch": 4.327390599675851,
"grad_norm": 0.4287979661216327,
"learning_rate": 1.5300055665843875e-05,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15963557362556458,
"step": 2670,
"valid_targets_mean": 4144.3,
"valid_targets_min": 1361
},
{
"epoch": 4.3354943273906,
"grad_norm": 0.38789554239222346,
"learning_rate": 1.5221534554514225e-05,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15133854746818542,
"step": 2675,
"valid_targets_mean": 5058.6,
"valid_targets_min": 720
},
{
"epoch": 4.343598055105349,
"grad_norm": 0.3826558850319014,
"learning_rate": 1.5143091479819146e-05,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11236849427223206,
"step": 2680,
"valid_targets_mean": 4173.0,
"valid_targets_min": 1376
},
{
"epoch": 4.351701782820097,
"grad_norm": 0.41350564769635967,
"learning_rate": 1.5064727722804531e-05,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1576721966266632,
"step": 2685,
"valid_targets_mean": 4335.1,
"valid_targets_min": 736
},
{
"epoch": 4.359805510534846,
"grad_norm": 0.43428870276985304,
"learning_rate": 1.4986444563220948e-05,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15112698078155518,
"step": 2690,
"valid_targets_mean": 4689.3,
"valid_targets_min": 1463
},
{
"epoch": 4.367909238249595,
"grad_norm": 0.37636298776027244,
"learning_rate": 1.4908243279502741e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15192727744579315,
"step": 2695,
"valid_targets_mean": 5081.8,
"valid_targets_min": 1286
},
{
"epoch": 4.376012965964343,
"grad_norm": 0.4397966263657783,
"learning_rate": 1.4830125148747138e-05,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20267480611801147,
"step": 2700,
"valid_targets_mean": 4718.6,
"valid_targets_min": 1545
},
{
"epoch": 4.3841166936790925,
"grad_norm": 0.43697570472069147,
"learning_rate": 1.475209144669341e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17748787999153137,
"step": 2705,
"valid_targets_mean": 4454.5,
"valid_targets_min": 678
},
{
"epoch": 4.392220421393841,
"grad_norm": 0.40519216103231753,
"learning_rate": 1.4674143447702036e-05,
"loss": 0.1443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14861005544662476,
"step": 2710,
"valid_targets_mean": 4173.1,
"valid_targets_min": 1378
},
{
"epoch": 4.40032414910859,
"grad_norm": 0.4149261608469548,
"learning_rate": 1.4596282424733877e-05,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14318136870861053,
"step": 2715,
"valid_targets_mean": 3568.0,
"valid_targets_min": 1307
},
{
"epoch": 4.408427876823339,
"grad_norm": 0.413620830401606,
"learning_rate": 1.4518509649329406e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13617044687271118,
"step": 2720,
"valid_targets_mean": 4053.7,
"valid_targets_min": 1375
},
{
"epoch": 4.416531604538087,
"grad_norm": 0.4139055830438707,
"learning_rate": 1.4440826391587926e-05,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15039443969726562,
"step": 2725,
"valid_targets_mean": 4649.6,
"valid_targets_min": 1379
},
{
"epoch": 4.424635332252836,
"grad_norm": 0.38376787901494286,
"learning_rate": 1.4363233920146855e-05,
"loss": 0.132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11790202558040619,
"step": 2730,
"valid_targets_mean": 4379.2,
"valid_targets_min": 1343
},
{
"epoch": 4.432739059967585,
"grad_norm": 0.4083381210433433,
"learning_rate": 1.4285733502160955e-05,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14305062592029572,
"step": 2735,
"valid_targets_mean": 4222.9,
"valid_targets_min": 2249
},
{
"epoch": 4.4408427876823335,
"grad_norm": 0.43656908504947634,
"learning_rate": 1.4208326403281702e-05,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16906528174877167,
"step": 2740,
"valid_targets_mean": 4419.1,
"valid_targets_min": 1353
},
{
"epoch": 4.448946515397083,
"grad_norm": 0.4003934548959086,
"learning_rate": 1.4131013887636576e-05,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15742376446723938,
"step": 2745,
"valid_targets_mean": 4827.4,
"valid_targets_min": 614
},
{
"epoch": 4.457050243111832,
"grad_norm": 0.3840972375272,
"learning_rate": 1.4053797217808432e-05,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20730182528495789,
"step": 2750,
"valid_targets_mean": 6605.8,
"valid_targets_min": 1338
},
{
"epoch": 4.46515397082658,
"grad_norm": 0.51490729353896,
"learning_rate": 1.3976677654814866e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1762509047985077,
"step": 2755,
"valid_targets_mean": 3084.2,
"valid_targets_min": 572
},
{
"epoch": 4.473257698541329,
"grad_norm": 0.4120105039229711,
"learning_rate": 1.3899656458087647e-05,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13307833671569824,
"step": 2760,
"valid_targets_mean": 4038.2,
"valid_targets_min": 1362
},
{
"epoch": 4.481361426256078,
"grad_norm": 0.4154926074325571,
"learning_rate": 1.3822734885452136e-05,
"loss": 0.1596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15126535296440125,
"step": 2765,
"valid_targets_mean": 4166.2,
"valid_targets_min": 1250
},
{
"epoch": 4.489465153970826,
"grad_norm": 0.42575125176208933,
"learning_rate": 1.3745914193106715e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1594770848751068,
"step": 2770,
"valid_targets_mean": 4068.7,
"valid_targets_min": 1298
},
{
"epoch": 4.4975688816855754,
"grad_norm": 0.5353069360545429,
"learning_rate": 1.366919563560233e-05,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2269129455089569,
"step": 2775,
"valid_targets_mean": 3735.1,
"valid_targets_min": 1960
},
{
"epoch": 4.5056726094003245,
"grad_norm": 0.4379484746796353,
"learning_rate": 1.3592580465821956e-05,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17367328703403473,
"step": 2780,
"valid_targets_mean": 3981.8,
"valid_targets_min": 1401
},
{
"epoch": 4.513776337115073,
"grad_norm": 0.4081571600651165,
"learning_rate": 1.3516069934960174e-05,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1333627998828888,
"step": 2785,
"valid_targets_mean": 4328.7,
"valid_targets_min": 1463
},
{
"epoch": 4.521880064829822,
"grad_norm": 0.4401935424136,
"learning_rate": 1.3439665292502695e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17039506137371063,
"step": 2790,
"valid_targets_mean": 4571.1,
"valid_targets_min": 1123
},
{
"epoch": 4.52998379254457,
"grad_norm": 0.4136394241777246,
"learning_rate": 1.3363367786205985e-05,
"loss": 0.1612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1595153957605362,
"step": 2795,
"valid_targets_mean": 4450.9,
"valid_targets_min": 1255
},
{
"epoch": 4.538087520259319,
"grad_norm": 0.4715376806814763,
"learning_rate": 1.3287178662076893e-05,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17418047785758972,
"step": 2800,
"valid_targets_mean": 3706.5,
"valid_targets_min": 1336
},
{
"epoch": 4.546191247974068,
"grad_norm": 0.4080114691839976,
"learning_rate": 1.3211099164352261e-05,
"loss": 0.1488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1426158845424652,
"step": 2805,
"valid_targets_mean": 4454.5,
"valid_targets_min": 1403
},
{
"epoch": 4.5542949756888165,
"grad_norm": 0.40195595415999114,
"learning_rate": 1.3135130535478655e-05,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.172957181930542,
"step": 2810,
"valid_targets_mean": 5329.9,
"valid_targets_min": 2400
},
{
"epoch": 4.562398703403566,
"grad_norm": 0.4043689543889982,
"learning_rate": 1.3059274016092057e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1621810793876648,
"step": 2815,
"valid_targets_mean": 4751.9,
"valid_targets_min": 2420
},
{
"epoch": 4.570502431118315,
"grad_norm": 0.40706944938964373,
"learning_rate": 1.2983530844997585e-05,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14708778262138367,
"step": 2820,
"valid_targets_mean": 4328.3,
"valid_targets_min": 1470
},
{
"epoch": 4.578606158833063,
"grad_norm": 0.44577995316271046,
"learning_rate": 1.2907902259149287e-05,
"loss": 0.1403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14407837390899658,
"step": 2825,
"valid_targets_mean": 3709.7,
"valid_targets_min": 1358
},
{
"epoch": 4.586709886547812,
"grad_norm": 0.43153844741457964,
"learning_rate": 1.2832389493629928e-05,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1508851945400238,
"step": 2830,
"valid_targets_mean": 4266.7,
"valid_targets_min": 1377
},
{
"epoch": 4.594813614262561,
"grad_norm": 0.4876086623263469,
"learning_rate": 1.275699378163083e-05,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14464884996414185,
"step": 2835,
"valid_targets_mean": 3399.9,
"valid_targets_min": 1327
},
{
"epoch": 4.602917341977309,
"grad_norm": 0.44880362000133106,
"learning_rate": 1.2681716354431704e-05,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15762996673583984,
"step": 2840,
"valid_targets_mean": 3883.4,
"valid_targets_min": 475
},
{
"epoch": 4.611021069692058,
"grad_norm": 0.38675466641560363,
"learning_rate": 1.2606558441380587e-05,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15953296422958374,
"step": 2845,
"valid_targets_mean": 4840.3,
"valid_targets_min": 1133
},
{
"epoch": 4.6191247974068075,
"grad_norm": 0.472879228012513,
"learning_rate": 1.2531521269873736e-05,
"loss": 0.1409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15060774981975555,
"step": 2850,
"valid_targets_mean": 3850.8,
"valid_targets_min": 1299
},
{
"epoch": 4.627228525121556,
"grad_norm": 0.42192553939479277,
"learning_rate": 1.245660606533559e-05,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17877057194709778,
"step": 2855,
"valid_targets_mean": 4635.9,
"valid_targets_min": 2261
},
{
"epoch": 4.635332252836305,
"grad_norm": 0.4117654319469982,
"learning_rate": 1.2381814051198751e-05,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1610351800918579,
"step": 2860,
"valid_targets_mean": 4523.1,
"valid_targets_min": 1408
},
{
"epoch": 4.643435980551054,
"grad_norm": 0.40499109611733797,
"learning_rate": 1.2307146448884021e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20495977997779846,
"step": 2865,
"valid_targets_mean": 6101.8,
"valid_targets_min": 2508
},
{
"epoch": 4.651539708265802,
"grad_norm": 0.3999011523794404,
"learning_rate": 1.2232604477780445e-05,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15106816589832306,
"step": 2870,
"valid_targets_mean": 4945.2,
"valid_targets_min": 2132
},
{
"epoch": 4.659643435980551,
"grad_norm": 0.43766033396391785,
"learning_rate": 1.2158189355225382e-05,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16236332058906555,
"step": 2875,
"valid_targets_mean": 4062.0,
"valid_targets_min": 1376
},
{
"epoch": 4.667747163695299,
"grad_norm": 0.4352998986314373,
"learning_rate": 1.2083902296484659e-05,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1306292861700058,
"step": 2880,
"valid_targets_mean": 3636.9,
"valid_targets_min": 1333
},
{
"epoch": 4.6758508914100485,
"grad_norm": 0.4010496520874604,
"learning_rate": 1.2009744514732698e-05,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12262415140867233,
"step": 2885,
"valid_targets_mean": 4299.4,
"valid_targets_min": 1561
},
{
"epoch": 4.683954619124798,
"grad_norm": 0.4326404264916919,
"learning_rate": 1.1935717221032707e-05,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14637967944145203,
"step": 2890,
"valid_targets_mean": 4200.1,
"valid_targets_min": 1452
},
{
"epoch": 4.692058346839546,
"grad_norm": 0.37813017019777695,
"learning_rate": 1.1861821624316916e-05,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19159114360809326,
"step": 2895,
"valid_targets_mean": 5756.8,
"valid_targets_min": 1276
},
{
"epoch": 4.700162074554295,
"grad_norm": 0.4516279524948185,
"learning_rate": 1.1788058931366822e-05,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15397486090660095,
"step": 2900,
"valid_targets_mean": 4007.5,
"valid_targets_min": 1361
},
{
"epoch": 4.708265802269044,
"grad_norm": 0.43035547891945575,
"learning_rate": 1.1714430346793479e-05,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15408627688884735,
"step": 2905,
"valid_targets_mean": 4192.9,
"valid_targets_min": 1428
},
{
"epoch": 4.716369529983792,
"grad_norm": 0.42815560735664004,
"learning_rate": 1.1640937073017837e-05,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12107810378074646,
"step": 2910,
"valid_targets_mean": 3664.6,
"valid_targets_min": 1463
},
{
"epoch": 4.724473257698541,
"grad_norm": 0.40919295231478586,
"learning_rate": 1.1567580310251097e-05,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1773926317691803,
"step": 2915,
"valid_targets_mean": 4703.0,
"valid_targets_min": 1690
},
{
"epoch": 4.73257698541329,
"grad_norm": 0.45522206805158383,
"learning_rate": 1.1494361256475105e-05,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22190578281879425,
"step": 2920,
"valid_targets_mean": 4572.4,
"valid_targets_min": 1368
},
{
"epoch": 4.740680713128039,
"grad_norm": 0.5050075348237438,
"learning_rate": 1.1421281107422804e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2091386914253235,
"step": 2925,
"valid_targets_mean": 4202.2,
"valid_targets_min": 459
},
{
"epoch": 4.748784440842788,
"grad_norm": 0.4245191076711551,
"learning_rate": 1.1348341056558709e-05,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15889310836791992,
"step": 2930,
"valid_targets_mean": 4289.3,
"valid_targets_min": 1435
},
{
"epoch": 4.756888168557537,
"grad_norm": 0.4329251764412851,
"learning_rate": 1.1275542295059384e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1462092250585556,
"step": 2935,
"valid_targets_mean": 4087.2,
"valid_targets_min": 1145
},
{
"epoch": 4.764991896272285,
"grad_norm": 0.3802982333434156,
"learning_rate": 1.1202886011794023e-05,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13929399847984314,
"step": 2940,
"valid_targets_mean": 4642.4,
"valid_targets_min": 1412
},
{
"epoch": 4.773095623987034,
"grad_norm": 0.41209636116235543,
"learning_rate": 1.1130373393305004e-05,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19231638312339783,
"step": 2945,
"valid_targets_mean": 5033.9,
"valid_targets_min": 1383
},
{
"epoch": 4.781199351701783,
"grad_norm": 0.44427285185848897,
"learning_rate": 1.1058005623788564e-05,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2078791707754135,
"step": 2950,
"valid_targets_mean": 4785.1,
"valid_targets_min": 1378
},
{
"epoch": 4.789303079416531,
"grad_norm": 0.4352310198495233,
"learning_rate": 1.0985783885075407e-05,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.150970458984375,
"step": 2955,
"valid_targets_mean": 4012.4,
"valid_targets_min": 1363
},
{
"epoch": 4.7974068071312805,
"grad_norm": 0.3848427570190768,
"learning_rate": 1.0913709356611411e-05,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15960577130317688,
"step": 2960,
"valid_targets_mean": 5311.9,
"valid_targets_min": 1370
},
{
"epoch": 4.805510534846029,
"grad_norm": 0.44803354520963734,
"learning_rate": 1.0841783215438406e-05,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13963055610656738,
"step": 2965,
"valid_targets_mean": 3312.8,
"valid_targets_min": 1017
},
{
"epoch": 4.813614262560778,
"grad_norm": 0.3988227974129132,
"learning_rate": 1.07700066361749e-05,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15069864690303802,
"step": 2970,
"valid_targets_mean": 4787.4,
"valid_targets_min": 1391
},
{
"epoch": 4.821717990275527,
"grad_norm": 0.3915010960709381,
"learning_rate": 1.0698380790996921e-05,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1701292246580124,
"step": 2975,
"valid_targets_mean": 5517.6,
"valid_targets_min": 1286
},
{
"epoch": 4.829821717990275,
"grad_norm": 0.39542275803497334,
"learning_rate": 1.0626906849618903e-05,
"loss": 0.1551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18241944909095764,
"step": 2980,
"valid_targets_mean": 5030.0,
"valid_targets_min": 1287
},
{
"epoch": 4.837925445705024,
"grad_norm": 0.44683950497997893,
"learning_rate": 1.0555585979274513e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17230674624443054,
"step": 2985,
"valid_targets_mean": 4003.1,
"valid_targets_min": 1242
},
{
"epoch": 4.846029173419773,
"grad_norm": 0.4059870561390617,
"learning_rate": 1.0484419344697667e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20989492535591125,
"step": 2990,
"valid_targets_mean": 5568.2,
"valid_targets_min": 1154
},
{
"epoch": 4.854132901134522,
"grad_norm": 0.3983641471581764,
"learning_rate": 1.0413408108103445e-05,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13275814056396484,
"step": 2995,
"valid_targets_mean": 4678.1,
"valid_targets_min": 1610
},
{
"epoch": 4.862236628849271,
"grad_norm": 0.40552466865168335,
"learning_rate": 1.0342553429169163e-05,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12622925639152527,
"step": 3000,
"valid_targets_mean": 4144.2,
"valid_targets_min": 1433
},
{
"epoch": 4.87034035656402,
"grad_norm": 0.46127170144733654,
"learning_rate": 1.0271856465015388e-05,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1375845968723297,
"step": 3005,
"valid_targets_mean": 3773.5,
"valid_targets_min": 1322
},
{
"epoch": 4.878444084278768,
"grad_norm": 0.4006716455638935,
"learning_rate": 1.0201318370187065e-05,
"loss": 0.1476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1406145840883255,
"step": 3010,
"valid_targets_mean": 4621.4,
"valid_targets_min": 1254
},
{
"epoch": 4.886547811993517,
"grad_norm": 0.5557739475830915,
"learning_rate": 1.0130940296634683e-05,
"loss": 0.1656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16776862740516663,
"step": 3015,
"valid_targets_mean": 5287.8,
"valid_targets_min": 1799
},
{
"epoch": 4.894651539708266,
"grad_norm": 0.4756221948224015,
"learning_rate": 1.0060723393695411e-05,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16840708255767822,
"step": 3020,
"valid_targets_mean": 4141.6,
"valid_targets_min": 1372
},
{
"epoch": 4.902755267423014,
"grad_norm": 0.42322941384456886,
"learning_rate": 9.990668808074378e-06,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16478174924850464,
"step": 3025,
"valid_targets_mean": 4635.3,
"valid_targets_min": 1330
},
{
"epoch": 4.9108589951377635,
"grad_norm": 0.5538397214115858,
"learning_rate": 9.920777683825906e-06,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16234804689884186,
"step": 3030,
"valid_targets_mean": 4091.6,
"valid_targets_min": 1426
},
{
"epoch": 4.918962722852513,
"grad_norm": 0.45256934248315905,
"learning_rate": 9.851051162334871e-06,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1707843542098999,
"step": 3035,
"valid_targets_mean": 4235.1,
"valid_targets_min": 953
},
{
"epoch": 4.927066450567261,
"grad_norm": 0.42005299538899554,
"learning_rate": 9.781490382298018e-06,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14144930243492126,
"step": 3040,
"valid_targets_mean": 4242.2,
"valid_targets_min": 1385
},
{
"epoch": 4.93517017828201,
"grad_norm": 0.3750072233886948,
"learning_rate": 9.712096479705382e-06,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12406253069639206,
"step": 3045,
"valid_targets_mean": 4638.4,
"valid_targets_min": 774
},
{
"epoch": 4.943273905996758,
"grad_norm": 0.45082908192768895,
"learning_rate": 9.642870587821761e-06,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1364569514989853,
"step": 3050,
"valid_targets_mean": 3741.4,
"valid_targets_min": 1223
},
{
"epoch": 4.951377633711507,
"grad_norm": 0.3965864418534553,
"learning_rate": 9.573813837168166e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15209516882896423,
"step": 3055,
"valid_targets_mean": 4904.0,
"valid_targets_min": 2367
},
{
"epoch": 4.959481361426256,
"grad_norm": 0.39620169212275697,
"learning_rate": 9.504927355503399e-06,
"loss": 0.1468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15747293829917908,
"step": 3060,
"valid_targets_mean": 4879.3,
"valid_targets_min": 1475
},
{
"epoch": 4.9675850891410045,
"grad_norm": 0.3607647863147781,
"learning_rate": 9.436212267805591e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1285112053155899,
"step": 3065,
"valid_targets_mean": 5197.2,
"valid_targets_min": 1343
},
{
"epoch": 4.975688816855754,
"grad_norm": 0.3991247742933118,
"learning_rate": 9.367669696253885e-06,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16575992107391357,
"step": 3070,
"valid_targets_mean": 4788.8,
"valid_targets_min": 1467
},
{
"epoch": 4.983792544570503,
"grad_norm": 0.3829873997175187,
"learning_rate": 9.299300760210059e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14778871834278107,
"step": 3075,
"valid_targets_mean": 5312.8,
"valid_targets_min": 1347
},
{
"epoch": 4.991896272285251,
"grad_norm": 0.3958938101503756,
"learning_rate": 9.231106576200268e-06,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16405248641967773,
"step": 3080,
"valid_targets_mean": 5094.3,
"valid_targets_min": 2401
},
{
"epoch": 5.0,
"grad_norm": 0.4343165631028096,
"learning_rate": 9.163088257896825e-06,
"loss": 0.1535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17925883829593658,
"step": 3085,
"valid_targets_mean": 4357.8,
"valid_targets_min": 848
},
{
"epoch": 5.008103727714749,
"grad_norm": 0.3968269887435741,
"learning_rate": 9.095246916099978e-06,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1301729828119278,
"step": 3090,
"valid_targets_mean": 4130.8,
"valid_targets_min": 1417
},
{
"epoch": 5.016207455429497,
"grad_norm": 0.3830139509562347,
"learning_rate": 9.027583658719812e-06,
"loss": 0.1474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14362263679504395,
"step": 3095,
"valid_targets_mean": 5103.4,
"valid_targets_min": 655
},
{
"epoch": 5.024311183144246,
"grad_norm": 0.47938454905224653,
"learning_rate": 8.960099590758104e-06,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18902552127838135,
"step": 3100,
"valid_targets_mean": 4781.9,
"valid_targets_min": 1409
},
{
"epoch": 5.0324149108589955,
"grad_norm": 0.4381421053581367,
"learning_rate": 8.892795814290342e-06,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15005433559417725,
"step": 3105,
"valid_targets_mean": 4429.2,
"valid_targets_min": 1444
},
{
"epoch": 5.040518638573744,
"grad_norm": 0.4876459262258521,
"learning_rate": 8.825673428447668e-06,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13418146967887878,
"step": 3110,
"valid_targets_mean": 3204.8,
"valid_targets_min": 1485
},
{
"epoch": 5.048622366288493,
"grad_norm": 0.3989147066059561,
"learning_rate": 8.758733529398945e-06,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17128801345825195,
"step": 3115,
"valid_targets_mean": 5239.9,
"valid_targets_min": 1425
},
{
"epoch": 5.056726094003242,
"grad_norm": 0.4370280823510108,
"learning_rate": 8.691977210332892e-06,
"loss": 0.1315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11790894716978073,
"step": 3120,
"valid_targets_mean": 3613.9,
"valid_targets_min": 1034
},
{
"epoch": 5.06482982171799,
"grad_norm": 0.41568029457497896,
"learning_rate": 8.625405561440172e-06,
"loss": 0.1358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14099830389022827,
"step": 3125,
"valid_targets_mean": 4263.2,
"valid_targets_min": 1364
},
{
"epoch": 5.072933549432739,
"grad_norm": 0.42290991910310327,
"learning_rate": 8.559019669895648e-06,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1221788227558136,
"step": 3130,
"valid_targets_mean": 4256.4,
"valid_targets_min": 1474
},
{
"epoch": 5.081037277147487,
"grad_norm": 0.4702701852005545,
"learning_rate": 8.492820619840563e-06,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15777115523815155,
"step": 3135,
"valid_targets_mean": 3536.3,
"valid_targets_min": 1438
},
{
"epoch": 5.0891410048622365,
"grad_norm": 0.4413433161733371,
"learning_rate": 8.426809492364907e-06,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14609038829803467,
"step": 3140,
"valid_targets_mean": 3770.4,
"valid_targets_min": 1291
},
{
"epoch": 5.097244732576986,
"grad_norm": 0.4022291115099463,
"learning_rate": 8.360987365489698e-06,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13611765205860138,
"step": 3145,
"valid_targets_mean": 4807.1,
"valid_targets_min": 1957
},
{
"epoch": 5.105348460291734,
"grad_norm": 0.44028849944004317,
"learning_rate": 8.295355314149413e-06,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1880216896533966,
"step": 3150,
"valid_targets_mean": 4639.2,
"valid_targets_min": 1273
},
{
"epoch": 5.113452188006483,
"grad_norm": 0.4105899389205008,
"learning_rate": 8.229914410174435e-06,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14482375979423523,
"step": 3155,
"valid_targets_mean": 4465.9,
"valid_targets_min": 1511
},
{
"epoch": 5.121555915721232,
"grad_norm": 0.5313511259093264,
"learning_rate": 8.16466572227352e-06,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16115616261959076,
"step": 3160,
"valid_targets_mean": 3309.9,
"valid_targets_min": 952
},
{
"epoch": 5.12965964343598,
"grad_norm": 0.4059132147272568,
"learning_rate": 8.099610316016373e-06,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1520155966281891,
"step": 3165,
"valid_targets_mean": 5199.4,
"valid_targets_min": 1868
},
{
"epoch": 5.137763371150729,
"grad_norm": 0.4673866325160744,
"learning_rate": 8.03474925381625e-06,
"loss": 0.1441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13583573698997498,
"step": 3170,
"valid_targets_mean": 3982.9,
"valid_targets_min": 1495
},
{
"epoch": 5.145867098865478,
"grad_norm": 0.41493588873304466,
"learning_rate": 7.97008359491257e-06,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15901492536067963,
"step": 3175,
"valid_targets_mean": 4487.7,
"valid_targets_min": 1652
},
{
"epoch": 5.153970826580227,
"grad_norm": 0.3817364201910083,
"learning_rate": 7.905614395353649e-06,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.169359028339386,
"step": 3180,
"valid_targets_mean": 6225.4,
"valid_targets_min": 2198
},
{
"epoch": 5.162074554294976,
"grad_norm": 0.4350949526585142,
"learning_rate": 7.841342707979442e-06,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17552366852760315,
"step": 3185,
"valid_targets_mean": 4653.2,
"valid_targets_min": 1322
},
{
"epoch": 5.170178282009725,
"grad_norm": 0.41863754898582967,
"learning_rate": 7.77726958240437e-06,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1267434060573578,
"step": 3190,
"valid_targets_mean": 4613.6,
"valid_targets_min": 1426
},
{
"epoch": 5.178282009724473,
"grad_norm": 0.4347179314293203,
"learning_rate": 7.713396065000133e-06,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17588908970355988,
"step": 3195,
"valid_targets_mean": 4821.8,
"valid_targets_min": 1307
},
{
"epoch": 5.186385737439222,
"grad_norm": 0.3741504502759021,
"learning_rate": 7.649723198878676e-06,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1253783404827118,
"step": 3200,
"valid_targets_mean": 5491.1,
"valid_targets_min": 701
},
{
"epoch": 5.194489465153971,
"grad_norm": 0.4167609797093036,
"learning_rate": 7.586252023875125e-06,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17448574304580688,
"step": 3205,
"valid_targets_mean": 4872.2,
"valid_targets_min": 1235
},
{
"epoch": 5.2025931928687195,
"grad_norm": 0.49274119267513306,
"learning_rate": 7.522983576530791e-06,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1333792507648468,
"step": 3210,
"valid_targets_mean": 3084.2,
"valid_targets_min": 1346
},
{
"epoch": 5.210696920583469,
"grad_norm": 0.4274907703145893,
"learning_rate": 7.459918890076272e-06,
"loss": 0.1403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13575004041194916,
"step": 3215,
"valid_targets_mean": 4470.8,
"valid_targets_min": 1264
},
{
"epoch": 5.218800648298217,
"grad_norm": 0.46411535100095974,
"learning_rate": 7.397058994414563e-06,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15877866744995117,
"step": 3220,
"valid_targets_mean": 4287.1,
"valid_targets_min": 1382
},
{
"epoch": 5.226904376012966,
"grad_norm": 0.42573424092441686,
"learning_rate": 7.3344049161042495e-06,
"loss": 0.1322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1221034973859787,
"step": 3225,
"valid_targets_mean": 4021.1,
"valid_targets_min": 1400
},
{
"epoch": 5.235008103727715,
"grad_norm": 0.4507514969839428,
"learning_rate": 7.271957678342738e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1447732299566269,
"step": 3230,
"valid_targets_mean": 4574.4,
"valid_targets_min": 1330
},
{
"epoch": 5.243111831442463,
"grad_norm": 0.37145491813213954,
"learning_rate": 7.209718300949519e-06,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1309332549571991,
"step": 3235,
"valid_targets_mean": 5262.1,
"valid_targets_min": 2743
},
{
"epoch": 5.251215559157212,
"grad_norm": 0.4714945659818598,
"learning_rate": 7.14768780034957e-06,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14775560796260834,
"step": 3240,
"valid_targets_mean": 3638.2,
"valid_targets_min": 1423
},
{
"epoch": 5.259319286871961,
"grad_norm": 0.44171814267945775,
"learning_rate": 7.085867189556697e-06,
"loss": 0.1551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19044238328933716,
"step": 3245,
"valid_targets_mean": 4592.8,
"valid_targets_min": 1328
},
{
"epoch": 5.26742301458671,
"grad_norm": 0.42451536992860567,
"learning_rate": 7.024257478157015e-06,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13068664073944092,
"step": 3250,
"valid_targets_mean": 4324.1,
"valid_targets_min": 1433
},
{
"epoch": 5.275526742301459,
"grad_norm": 0.4655686708567891,
"learning_rate": 6.96285967229249e-06,
"loss": 0.1589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.165610671043396,
"step": 3255,
"valid_targets_mean": 3945.8,
"valid_targets_min": 1336
},
{
"epoch": 5.283630470016208,
"grad_norm": 0.4449132978595166,
"learning_rate": 6.901674774644449e-06,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18209701776504517,
"step": 3260,
"valid_targets_mean": 4861.0,
"valid_targets_min": 1069
},
{
"epoch": 5.291734197730956,
"grad_norm": 0.40137615746667976,
"learning_rate": 6.840703784417262e-06,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1194748729467392,
"step": 3265,
"valid_targets_mean": 4572.1,
"valid_targets_min": 1018
},
{
"epoch": 5.299837925445705,
"grad_norm": 0.4359004956729294,
"learning_rate": 6.779947697321974e-06,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16937534511089325,
"step": 3270,
"valid_targets_mean": 4552.4,
"valid_targets_min": 1345
},
{
"epoch": 5.307941653160454,
"grad_norm": 0.4724067916024582,
"learning_rate": 6.719407505560094e-06,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1636667549610138,
"step": 3275,
"valid_targets_mean": 4430.4,
"valid_targets_min": 1409
},
{
"epoch": 5.316045380875202,
"grad_norm": 0.44441044209123404,
"learning_rate": 6.659084197807348e-06,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16976942121982574,
"step": 3280,
"valid_targets_mean": 4312.1,
"valid_targets_min": 1353
},
{
"epoch": 5.3241491085899515,
"grad_norm": 0.4150836959257879,
"learning_rate": 6.598978759197554e-06,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11863559484481812,
"step": 3285,
"valid_targets_mean": 3961.8,
"valid_targets_min": 1429
},
{
"epoch": 5.332252836304701,
"grad_norm": 0.4119131054274552,
"learning_rate": 6.539092171306541e-06,
"loss": 0.1478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15804126858711243,
"step": 3290,
"valid_targets_mean": 4975.1,
"valid_targets_min": 1620
},
{
"epoch": 5.340356564019449,
"grad_norm": 0.4431169860534305,
"learning_rate": 6.479425412136093e-06,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13536761701107025,
"step": 3295,
"valid_targets_mean": 3993.5,
"valid_targets_min": 1020
},
{
"epoch": 5.348460291734198,
"grad_norm": 0.40748142947812366,
"learning_rate": 6.419979456098016e-06,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14843331277370453,
"step": 3300,
"valid_targets_mean": 4888.7,
"valid_targets_min": 572
},
{
"epoch": 5.356564019448946,
"grad_norm": 0.38063983350274677,
"learning_rate": 6.360755273998174e-06,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13254444301128387,
"step": 3305,
"valid_targets_mean": 5138.4,
"valid_targets_min": 2549
},
{
"epoch": 5.364667747163695,
"grad_norm": 0.41858383988280357,
"learning_rate": 6.301753833020691e-06,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1635013222694397,
"step": 3310,
"valid_targets_mean": 5046.3,
"valid_targets_min": 2402
},
{
"epoch": 5.372771474878444,
"grad_norm": 0.47226938264774465,
"learning_rate": 6.242976096712112e-06,
"loss": 0.1405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14795152842998505,
"step": 3315,
"valid_targets_mean": 3503.7,
"valid_targets_min": 1286
},
{
"epoch": 5.3808752025931925,
"grad_norm": 0.41899647955888863,
"learning_rate": 6.18442302496568e-06,
"loss": 0.14,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15799807012081146,
"step": 3320,
"valid_targets_mean": 4453.1,
"valid_targets_min": 1332
},
{
"epoch": 5.388978930307942,
"grad_norm": 0.4445100748493841,
"learning_rate": 6.1260955740056835e-06,
"loss": 0.1389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12522292137145996,
"step": 3325,
"valid_targets_mean": 3427.6,
"valid_targets_min": 1299
},
{
"epoch": 5.397082658022691,
"grad_norm": 0.4442798105619433,
"learning_rate": 6.067994696371797e-06,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17335715889930725,
"step": 3330,
"valid_targets_mean": 4862.9,
"valid_targets_min": 1227
},
{
"epoch": 5.405186385737439,
"grad_norm": 0.42669050164619443,
"learning_rate": 6.010121340903574e-06,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13971629738807678,
"step": 3335,
"valid_targets_mean": 4265.6,
"valid_targets_min": 1599
},
{
"epoch": 5.413290113452188,
"grad_norm": 0.424049644257688,
"learning_rate": 5.952476452724898e-06,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1421208679676056,
"step": 3340,
"valid_targets_mean": 4199.8,
"valid_targets_min": 1370
},
{
"epoch": 5.421393841166937,
"grad_norm": 0.39489552858065036,
"learning_rate": 5.895060973228606e-06,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1596226692199707,
"step": 3345,
"valid_targets_mean": 5840.3,
"valid_targets_min": 1379
},
{
"epoch": 5.429497568881685,
"grad_norm": 0.3971053859954934,
"learning_rate": 5.837875840061064e-06,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.152027428150177,
"step": 3350,
"valid_targets_mean": 5854.6,
"valid_targets_min": 2489
},
{
"epoch": 5.437601296596434,
"grad_norm": 0.42180726865326074,
"learning_rate": 5.780921987106878e-06,
"loss": 0.1451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1312631070613861,
"step": 3355,
"valid_targets_mean": 4105.1,
"valid_targets_min": 1417
},
{
"epoch": 5.4457050243111835,
"grad_norm": 0.4268852043834351,
"learning_rate": 5.724200344473651e-06,
"loss": 0.147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14172303676605225,
"step": 3360,
"valid_targets_mean": 4448.6,
"valid_targets_min": 2495
},
{
"epoch": 5.453808752025932,
"grad_norm": 0.4342642841720189,
"learning_rate": 5.66771183847677e-06,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14243818819522858,
"step": 3365,
"valid_targets_mean": 4433.8,
"valid_targets_min": 2387
},
{
"epoch": 5.461912479740681,
"grad_norm": 0.4642434978963273,
"learning_rate": 5.611457391624309e-06,
"loss": 0.1567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18304626643657684,
"step": 3370,
"valid_targets_mean": 4033.4,
"valid_targets_min": 1502
},
{
"epoch": 5.47001620745543,
"grad_norm": 0.4127896613433934,
"learning_rate": 5.555437922601918e-06,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1505068838596344,
"step": 3375,
"valid_targets_mean": 4843.2,
"valid_targets_min": 1356
},
{
"epoch": 5.478119935170178,
"grad_norm": 0.4367679456778927,
"learning_rate": 5.499654346257879e-06,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13455377519130707,
"step": 3380,
"valid_targets_mean": 4203.2,
"valid_targets_min": 1382
},
{
"epoch": 5.486223662884927,
"grad_norm": 0.4701162288125186,
"learning_rate": 5.444107573588116e-06,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12258616089820862,
"step": 3385,
"valid_targets_mean": 3157.6,
"valid_targets_min": 1421
},
{
"epoch": 5.4943273905996755,
"grad_norm": 0.4412200000803221,
"learning_rate": 5.388798511721329e-06,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1565963327884674,
"step": 3390,
"valid_targets_mean": 4411.5,
"valid_targets_min": 459
},
{
"epoch": 5.5024311183144246,
"grad_norm": 0.3600623889453669,
"learning_rate": 5.333728063904213e-06,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14468525350093842,
"step": 3395,
"valid_targets_mean": 5956.2,
"valid_targets_min": 1337
},
{
"epoch": 5.510534846029174,
"grad_norm": 0.4598981790632925,
"learning_rate": 5.278897129486656e-06,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14410819113254547,
"step": 3400,
"valid_targets_mean": 3575.8,
"valid_targets_min": 1436
},
{
"epoch": 5.518638573743922,
"grad_norm": 0.4580690381488814,
"learning_rate": 5.224306603907095e-06,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18686503171920776,
"step": 3405,
"valid_targets_mean": 4421.5,
"valid_targets_min": 844
},
{
"epoch": 5.526742301458671,
"grad_norm": 0.40648216673551496,
"learning_rate": 5.169957378677859e-06,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16417232155799866,
"step": 3410,
"valid_targets_mean": 5176.2,
"valid_targets_min": 1453
},
{
"epoch": 5.53484602917342,
"grad_norm": 0.42527715899312485,
"learning_rate": 5.11585034137064e-06,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14472799003124237,
"step": 3415,
"valid_targets_mean": 4337.4,
"valid_targets_min": 1441
},
{
"epoch": 5.542949756888168,
"grad_norm": 0.4257643164617211,
"learning_rate": 5.061986375601977e-06,
"loss": 0.1491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1356392502784729,
"step": 3420,
"valid_targets_mean": 4046.2,
"valid_targets_min": 1496
},
{
"epoch": 5.551053484602917,
"grad_norm": 0.3765615482008815,
"learning_rate": 5.0083663610188215e-06,
"loss": 0.1357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11371708661317825,
"step": 3425,
"valid_targets_mean": 5338.3,
"valid_targets_min": 953
},
{
"epoch": 5.5591572123176665,
"grad_norm": 0.3964517008546095,
"learning_rate": 4.954991173284207e-06,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15065959095954895,
"step": 3430,
"valid_targets_mean": 5702.8,
"valid_targets_min": 1311
},
{
"epoch": 5.567260940032415,
"grad_norm": 0.4508220930947401,
"learning_rate": 4.901861684062899e-06,
"loss": 0.1398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1419251263141632,
"step": 3435,
"valid_targets_mean": 4317.9,
"valid_targets_min": 1380
},
{
"epoch": 5.575364667747164,
"grad_norm": 0.38660509987607483,
"learning_rate": 4.848978761007206e-06,
"loss": 0.147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1457797884941101,
"step": 3440,
"valid_targets_mean": 5160.2,
"valid_targets_min": 1217
},
{
"epoch": 5.583468395461912,
"grad_norm": 0.38807504896802625,
"learning_rate": 4.796343267742782e-06,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1514224410057068,
"step": 3445,
"valid_targets_mean": 5379.7,
"valid_targets_min": 1357
},
{
"epoch": 5.591572123176661,
"grad_norm": 0.46275031225232527,
"learning_rate": 4.743956063854529e-06,
"loss": 0.1333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1503310203552246,
"step": 3450,
"valid_targets_mean": 3940.9,
"valid_targets_min": 1426
},
{
"epoch": 5.59967585089141,
"grad_norm": 0.4452707900888768,
"learning_rate": 4.691818004872557e-06,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14793214201927185,
"step": 3455,
"valid_targets_mean": 4227.8,
"valid_targets_min": 1309
},
{
"epoch": 5.607779578606159,
"grad_norm": 0.41732278622886226,
"learning_rate": 4.639929942258217e-06,
"loss": 0.1419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15394923090934753,
"step": 3460,
"valid_targets_mean": 4887.3,
"valid_targets_min": 1363
},
{
"epoch": 5.6158833063209075,
"grad_norm": 0.3755320355039727,
"learning_rate": 4.588292723390204e-06,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14299200475215912,
"step": 3465,
"valid_targets_mean": 4793.9,
"valid_targets_min": 1847
},
{
"epoch": 5.623987034035657,
"grad_norm": 0.4068035472698011,
"learning_rate": 4.536907191550694e-06,
"loss": 0.1521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16701841354370117,
"step": 3470,
"valid_targets_mean": 5323.9,
"valid_targets_min": 2438
},
{
"epoch": 5.632090761750405,
"grad_norm": 0.4033726053317685,
"learning_rate": 4.4857741859116024e-06,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14929088950157166,
"step": 3475,
"valid_targets_mean": 5282.5,
"valid_targets_min": 1223
},
{
"epoch": 5.640194489465154,
"grad_norm": 0.4361679512957998,
"learning_rate": 4.434894541520862e-06,
"loss": 0.1533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16081160306930542,
"step": 3480,
"valid_targets_mean": 5153.8,
"valid_targets_min": 2145
},
{
"epoch": 5.648298217179903,
"grad_norm": 0.4767583735219021,
"learning_rate": 4.3842690892887795e-06,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14562401175498962,
"step": 3485,
"valid_targets_mean": 3356.0,
"valid_targets_min": 1391
},
{
"epoch": 5.656401944894651,
"grad_norm": 0.40801873437269603,
"learning_rate": 4.333898655974484e-06,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1436278223991394,
"step": 3490,
"valid_targets_mean": 5208.7,
"valid_targets_min": 2539
},
{
"epoch": 5.6645056726094,
"grad_norm": 0.39494427065104426,
"learning_rate": 4.283784064172405e-06,
"loss": 0.1417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1220889762043953,
"step": 3495,
"valid_targets_mean": 4590.6,
"valid_targets_min": 1449
},
{
"epoch": 5.672609400324149,
"grad_norm": 0.3727393025793469,
"learning_rate": 4.233926132298867e-06,
"loss": 0.142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12601833045482635,
"step": 3500,
"valid_targets_mean": 5080.4,
"valid_targets_min": 1314
},
{
"epoch": 5.680713128038898,
"grad_norm": 0.4579620633493333,
"learning_rate": 4.1843256745787e-06,
"loss": 0.1402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14137154817581177,
"step": 3505,
"valid_targets_mean": 4364.9,
"valid_targets_min": 1103
},
{
"epoch": 5.688816855753647,
"grad_norm": 0.4210006457716337,
"learning_rate": 4.134983501031942e-06,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14210812747478485,
"step": 3510,
"valid_targets_mean": 4854.4,
"valid_targets_min": 1520
},
{
"epoch": 5.696920583468396,
"grad_norm": 0.44180877138160274,
"learning_rate": 4.085900417460633e-06,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17552919685840607,
"step": 3515,
"valid_targets_mean": 4908.9,
"valid_targets_min": 1473
},
{
"epoch": 5.705024311183144,
"grad_norm": 0.44830779855225567,
"learning_rate": 4.037077225435628e-06,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12323147058486938,
"step": 3520,
"valid_targets_mean": 3771.7,
"valid_targets_min": 1324
},
{
"epoch": 5.713128038897893,
"grad_norm": 0.37678935263590063,
"learning_rate": 3.988514722283523e-06,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12797431647777557,
"step": 3525,
"valid_targets_mean": 5230.3,
"valid_targets_min": 2085
},
{
"epoch": 5.721231766612641,
"grad_norm": 0.43358458671138017,
"learning_rate": 3.940213701073636e-06,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17389845848083496,
"step": 3530,
"valid_targets_mean": 4511.4,
"valid_targets_min": 1178
},
{
"epoch": 5.72933549432739,
"grad_norm": 0.46038006750182087,
"learning_rate": 3.892174950605039e-06,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14572468400001526,
"step": 3535,
"valid_targets_mean": 4509.4,
"valid_targets_min": 1453
},
{
"epoch": 5.7374392220421395,
"grad_norm": 0.4492541988440627,
"learning_rate": 3.844399255393705e-06,
"loss": 0.1513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1724633127450943,
"step": 3540,
"valid_targets_mean": 4466.0,
"valid_targets_min": 1992
},
{
"epoch": 5.745542949756889,
"grad_norm": 0.4795417181415384,
"learning_rate": 3.7968873956596563e-06,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21007636189460754,
"step": 3545,
"valid_targets_mean": 4530.2,
"valid_targets_min": 676
},
{
"epoch": 5.753646677471637,
"grad_norm": 0.46983777722992826,
"learning_rate": 3.749640147314264e-06,
"loss": 0.1344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1398407220840454,
"step": 3550,
"valid_targets_mean": 3593.2,
"valid_targets_min": 1362
},
{
"epoch": 5.761750405186386,
"grad_norm": 0.38049959215799295,
"learning_rate": 3.7026582819475443e-06,
"loss": 0.1455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12801112234592438,
"step": 3555,
"valid_targets_mean": 4737.4,
"valid_targets_min": 2235
},
{
"epoch": 5.769854132901134,
"grad_norm": 0.461054141076095,
"learning_rate": 3.6559425668155733e-06,
"loss": 0.1682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17298737168312073,
"step": 3560,
"valid_targets_mean": 3996.0,
"valid_targets_min": 578
},
{
"epoch": 5.777957860615883,
"grad_norm": 0.4360822162589034,
"learning_rate": 3.6094937648279647e-06,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14468207955360413,
"step": 3565,
"valid_targets_mean": 4477.3,
"valid_targets_min": 1338
},
{
"epoch": 5.786061588330632,
"grad_norm": 0.4418639601057002,
"learning_rate": 3.563312634535383e-06,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.174360454082489,
"step": 3570,
"valid_targets_mean": 4328.9,
"valid_targets_min": 1142
},
{
"epoch": 5.7941653160453805,
"grad_norm": 0.43052400582331984,
"learning_rate": 3.517399930117196e-06,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16029515862464905,
"step": 3575,
"valid_targets_mean": 4829.5,
"valid_targets_min": 2103
},
{
"epoch": 5.80226904376013,
"grad_norm": 0.4590780539905914,
"learning_rate": 3.4717564013691087e-06,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12398982793092728,
"step": 3580,
"valid_targets_mean": 3912.6,
"valid_targets_min": 1397
},
{
"epoch": 5.810372771474879,
"grad_norm": 0.4078367715005851,
"learning_rate": 3.4263827936909744e-06,
"loss": 0.1435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16300195455551147,
"step": 3585,
"valid_targets_mean": 5371.7,
"valid_targets_min": 1463
},
{
"epoch": 5.818476499189627,
"grad_norm": 0.41245112010062046,
"learning_rate": 3.38127984807457e-06,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1823018491268158,
"step": 3590,
"valid_targets_mean": 5383.8,
"valid_targets_min": 1390
},
{
"epoch": 5.826580226904376,
"grad_norm": 0.41228359986338586,
"learning_rate": 3.3364483010915237e-06,
"loss": 0.1528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16868922114372253,
"step": 3595,
"valid_targets_mean": 5036.3,
"valid_targets_min": 1354
},
{
"epoch": 5.834683954619125,
"grad_norm": 0.4025206613962,
"learning_rate": 3.2918888848812913e-06,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1353769749403,
"step": 3600,
"valid_targets_mean": 4976.0,
"valid_targets_min": 2813
},
{
"epoch": 5.842787682333873,
"grad_norm": 0.4173151097140713,
"learning_rate": 3.2476023271391698e-06,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1375451683998108,
"step": 3605,
"valid_targets_mean": 4525.1,
"valid_targets_min": 782
},
{
"epoch": 5.8508914100486225,
"grad_norm": 0.4600876492050453,
"learning_rate": 3.2035893511044524e-06,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14605942368507385,
"step": 3610,
"valid_targets_mean": 3913.0,
"valid_targets_min": 970
},
{
"epoch": 5.858995137763371,
"grad_norm": 0.3887244887549261,
"learning_rate": 3.159850675548577e-06,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13345900177955627,
"step": 3615,
"valid_targets_mean": 4845.1,
"valid_targets_min": 1469
},
{
"epoch": 5.86709886547812,
"grad_norm": 0.42651798816381464,
"learning_rate": 3.116387014763429e-06,
"loss": 0.1397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.126625657081604,
"step": 3620,
"valid_targets_mean": 3999.2,
"valid_targets_min": 1276
},
{
"epoch": 5.875202593192869,
"grad_norm": 0.404591471586791,
"learning_rate": 3.073199078549638e-06,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14635738730430603,
"step": 3625,
"valid_targets_mean": 5098.9,
"valid_targets_min": 2199
},
{
"epoch": 5.883306320907618,
"grad_norm": 0.39164350966421785,
"learning_rate": 3.0302875722050064e-06,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13689061999320984,
"step": 3630,
"valid_targets_mean": 5409.9,
"valid_targets_min": 1353
},
{
"epoch": 5.891410048622366,
"grad_norm": 0.40314319994514747,
"learning_rate": 2.987653196513003e-06,
"loss": 0.1386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12066174298524857,
"step": 3635,
"valid_targets_mean": 4769.4,
"valid_targets_min": 1481
},
{
"epoch": 5.899513776337115,
"grad_norm": 0.4836471889303801,
"learning_rate": 2.9452966477312815e-06,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16042715311050415,
"step": 3640,
"valid_targets_mean": 3923.6,
"valid_targets_min": 715
},
{
"epoch": 5.9076175040518635,
"grad_norm": 0.46089519237408594,
"learning_rate": 2.9032186175803545e-06,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20133355259895325,
"step": 3645,
"valid_targets_mean": 4924.5,
"valid_targets_min": 1456
},
{
"epoch": 5.915721231766613,
"grad_norm": 0.4565914501000379,
"learning_rate": 2.8614197932322585e-06,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13373398780822754,
"step": 3650,
"valid_targets_mean": 3931.9,
"valid_targets_min": 1146
},
{
"epoch": 5.923824959481362,
"grad_norm": 0.4408552819806134,
"learning_rate": 2.819900857299358e-06,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15062901377677917,
"step": 3655,
"valid_targets_mean": 4433.2,
"valid_targets_min": 2133
},
{
"epoch": 5.93192868719611,
"grad_norm": 0.3933877770279565,
"learning_rate": 2.778662487823187e-06,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14033809304237366,
"step": 3660,
"valid_targets_mean": 5082.8,
"valid_targets_min": 1363
},
{
"epoch": 5.940032414910859,
"grad_norm": 0.4435388470880922,
"learning_rate": 2.7377053582633652e-06,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1453082263469696,
"step": 3665,
"valid_targets_mean": 4131.4,
"valid_targets_min": 1133
},
{
"epoch": 5.948136142625608,
"grad_norm": 0.4303911052570311,
"learning_rate": 2.6970301374866337e-06,
"loss": 0.1355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13601087033748627,
"step": 3670,
"valid_targets_mean": 3857.9,
"valid_targets_min": 1394
},
{
"epoch": 5.956239870340356,
"grad_norm": 0.3821087196176658,
"learning_rate": 2.656637489755889e-06,
"loss": 0.1601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16024444997310638,
"step": 3675,
"valid_targets_mean": 6057.2,
"valid_targets_min": 2643
},
{
"epoch": 5.964343598055105,
"grad_norm": 0.47180883356979997,
"learning_rate": 2.616528074719371e-06,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1266734004020691,
"step": 3680,
"valid_targets_mean": 3223.6,
"valid_targets_min": 1354
},
{
"epoch": 5.9724473257698545,
"grad_norm": 0.42562678571064955,
"learning_rate": 2.576702547399863e-06,
"loss": 0.1407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13321202993392944,
"step": 3685,
"valid_targets_mean": 4263.2,
"valid_targets_min": 1387
},
{
"epoch": 5.980551053484603,
"grad_norm": 0.36066353182020416,
"learning_rate": 2.53716155818402e-06,
"loss": 0.1576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12179975211620331,
"step": 3690,
"valid_targets_mean": 5267.1,
"valid_targets_min": 1255
},
{
"epoch": 5.988654781199352,
"grad_norm": 0.47127497546296976,
"learning_rate": 2.49790575281172e-06,
"loss": 0.1475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15804405510425568,
"step": 3695,
"valid_targets_mean": 4068.7,
"valid_targets_min": 1112
},
{
"epoch": 5.9967585089141,
"grad_norm": 0.412154254601803,
"learning_rate": 2.4589357723655405e-06,
"loss": 0.1418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12866616249084473,
"step": 3700,
"valid_targets_mean": 4358.7,
"valid_targets_min": 1364
},
{
"epoch": 6.004862236628849,
"grad_norm": 0.4074648856856215,
"learning_rate": 2.4202522532602846e-06,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16085468232631683,
"step": 3705,
"valid_targets_mean": 4796.6,
"valid_targets_min": 614
},
{
"epoch": 6.012965964343598,
"grad_norm": 0.3982979848177161,
"learning_rate": 2.381855827232571e-06,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11491286009550095,
"step": 3710,
"valid_targets_mean": 4550.1,
"valid_targets_min": 1490
},
{
"epoch": 6.021069692058346,
"grad_norm": 0.41195237608810253,
"learning_rate": 2.343747121330544e-06,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12920981645584106,
"step": 3715,
"valid_targets_mean": 4646.1,
"valid_targets_min": 1293
},
{
"epoch": 6.0291734197730955,
"grad_norm": 0.3762383380804612,
"learning_rate": 2.3059267579036183e-06,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14210054278373718,
"step": 3720,
"valid_targets_mean": 5317.4,
"valid_targets_min": 2300
},
{
"epoch": 6.037277147487845,
"grad_norm": 0.4411386976702003,
"learning_rate": 2.268395354592312e-06,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23801150918006897,
"step": 3725,
"valid_targets_mean": 5265.6,
"valid_targets_min": 1380
},
{
"epoch": 6.045380875202593,
"grad_norm": 0.36386178774219285,
"learning_rate": 2.2311535243181637e-06,
"loss": 0.1381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10592524707317352,
"step": 3730,
"valid_targets_mean": 5293.6,
"valid_targets_min": 2116
},
{
"epoch": 6.053484602917342,
"grad_norm": 0.38730906481519406,
"learning_rate": 2.1942018752737227e-06,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11556782573461533,
"step": 3735,
"valid_targets_mean": 4649.8,
"valid_targets_min": 1440
},
{
"epoch": 6.061588330632091,
"grad_norm": 0.450030924562011,
"learning_rate": 2.1575410109126293e-06,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13595318794250488,
"step": 3740,
"valid_targets_mean": 4143.9,
"valid_targets_min": 1770
},
{
"epoch": 6.069692058346839,
"grad_norm": 0.4074205018656638,
"learning_rate": 2.121171529939734e-06,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13340912759304047,
"step": 3745,
"valid_targets_mean": 4517.4,
"valid_targets_min": 1548
},
{
"epoch": 6.077795786061588,
"grad_norm": 0.4529633278316854,
"learning_rate": 2.085094026301349e-06,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13528558611869812,
"step": 3750,
"valid_targets_mean": 3715.6,
"valid_targets_min": 1436
},
{
"epoch": 6.085899513776337,
"grad_norm": 0.4190960207519973,
"learning_rate": 2.0493090891755262e-06,
"loss": 0.1298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.133295476436615,
"step": 3755,
"valid_targets_mean": 4487.4,
"valid_targets_min": 2011
},
{
"epoch": 6.094003241491086,
"grad_norm": 0.42452718549108076,
"learning_rate": 2.013817302962444e-06,
"loss": 0.1342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13761006295681,
"step": 3760,
"valid_targets_mean": 4643.9,
"valid_targets_min": 1444
},
{
"epoch": 6.102106969205835,
"grad_norm": 0.4272396450205022,
"learning_rate": 1.9786192472748643e-06,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13067889213562012,
"step": 3765,
"valid_targets_mean": 4262.9,
"valid_targets_min": 1406
},
{
"epoch": 6.110210696920584,
"grad_norm": 0.4182294978740752,
"learning_rate": 1.9437154969286577e-06,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13712134957313538,
"step": 3770,
"valid_targets_mean": 4474.1,
"valid_targets_min": 1402
},
{
"epoch": 6.118314424635332,
"grad_norm": 0.39799797675881166,
"learning_rate": 1.9091066219334365e-06,
"loss": 0.1354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11920727789402008,
"step": 3775,
"valid_targets_mean": 4693.6,
"valid_targets_min": 1402
},
{
"epoch": 6.126418152350081,
"grad_norm": 0.41626093816189375,
"learning_rate": 1.8747931874832325e-06,
"loss": 0.1384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12707899510860443,
"step": 3780,
"valid_targets_mean": 4307.7,
"valid_targets_min": 2364
},
{
"epoch": 6.13452188006483,
"grad_norm": 0.4565834650265614,
"learning_rate": 1.8407757539472548e-06,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1688140332698822,
"step": 3785,
"valid_targets_mean": 4503.1,
"valid_targets_min": 1358
},
{
"epoch": 6.1426256077795784,
"grad_norm": 0.42857367927873613,
"learning_rate": 1.8070548768607744e-06,
"loss": 0.1347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11357726156711578,
"step": 3790,
"valid_targets_mean": 4074.0,
"valid_targets_min": 1394
},
{
"epoch": 6.1507293354943275,
"grad_norm": 0.4370185122080301,
"learning_rate": 1.773631106915996e-06,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1375211924314499,
"step": 3795,
"valid_targets_mean": 4234.0,
"valid_targets_min": 1432
},
{
"epoch": 6.158833063209076,
"grad_norm": 0.4109496720135297,
"learning_rate": 1.740504989953129e-06,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.120418019592762,
"step": 3800,
"valid_targets_mean": 4492.1,
"valid_targets_min": 676
},
{
"epoch": 6.166936790923825,
"grad_norm": 0.4439327368735157,
"learning_rate": 1.707677066951432e-06,
"loss": 0.1473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12108451128005981,
"step": 3805,
"valid_targets_mean": 4027.9,
"valid_targets_min": 1434
},
{
"epoch": 6.175040518638574,
"grad_norm": 0.4458492212785282,
"learning_rate": 1.6751478740203776e-06,
"loss": 0.1461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17976900935173035,
"step": 3810,
"valid_targets_mean": 4864.9,
"valid_targets_min": 2482
},
{
"epoch": 6.183144246353322,
"grad_norm": 0.4227256889119454,
"learning_rate": 1.6429179423909248e-06,
"loss": 0.1419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1274784505367279,
"step": 3815,
"valid_targets_mean": 4209.2,
"valid_targets_min": 1356
},
{
"epoch": 6.191247974068071,
"grad_norm": 0.8626461611916949,
"learning_rate": 1.6109877984068089e-06,
"loss": 0.1324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13011348247528076,
"step": 3820,
"valid_targets_mean": 4491.9,
"valid_targets_min": 2135
},
{
"epoch": 6.19935170178282,
"grad_norm": 0.4238788306714976,
"learning_rate": 1.5793579635159883e-06,
"loss": 0.1311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11838759481906891,
"step": 3825,
"valid_targets_mean": 4214.7,
"valid_targets_min": 1133
},
{
"epoch": 6.207455429497569,
"grad_norm": 0.4599834513527078,
"learning_rate": 1.5480289542620686e-06,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11634839326143265,
"step": 3830,
"valid_targets_mean": 3438.7,
"valid_targets_min": 1400
},
{
"epoch": 6.215559157212318,
"grad_norm": 0.5108850540567319,
"learning_rate": 1.517001282275936e-06,
"loss": 0.1436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14523491263389587,
"step": 3835,
"valid_targets_mean": 3825.8,
"valid_targets_min": 836
},
{
"epoch": 6.223662884927067,
"grad_norm": 0.45879081355549145,
"learning_rate": 1.486275454267354e-06,
"loss": 0.1339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13570156693458557,
"step": 3840,
"valid_targets_mean": 3901.1,
"valid_targets_min": 1254
},
{
"epoch": 6.231766612641815,
"grad_norm": 0.45552777520225757,
"learning_rate": 1.4558519720166975e-06,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15282249450683594,
"step": 3845,
"valid_targets_mean": 4158.1,
"valid_targets_min": 1273
},
{
"epoch": 6.239870340356564,
"grad_norm": 0.3713879886251543,
"learning_rate": 1.4257313323667798e-06,
"loss": 0.1286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11740448325872421,
"step": 3850,
"valid_targets_mean": 4931.4,
"valid_targets_min": 1525
},
{
"epoch": 6.247974068071313,
"grad_norm": 0.4063595181498841,
"learning_rate": 1.3959140272146998e-06,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15681567788124084,
"step": 3855,
"valid_targets_mean": 5654.3,
"valid_targets_min": 1510
},
{
"epoch": 6.256077795786061,
"grad_norm": 0.4542483110057598,
"learning_rate": 1.366400543503854e-06,
"loss": 0.1499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14490097761154175,
"step": 3860,
"valid_targets_mean": 4448.6,
"valid_targets_min": 1146
},
{
"epoch": 6.2641815235008105,
"grad_norm": 0.45532835475196615,
"learning_rate": 1.3371913632159506e-06,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13060614466667175,
"step": 3865,
"valid_targets_mean": 3886.1,
"valid_targets_min": 1264
},
{
"epoch": 6.272285251215559,
"grad_norm": 0.45124326933966985,
"learning_rate": 1.3082869633631413e-06,
"loss": 0.153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1641269326210022,
"step": 3870,
"valid_targets_mean": 4320.4,
"valid_targets_min": 2442
},
{
"epoch": 6.280388978930308,
"grad_norm": 0.4779066296871159,
"learning_rate": 1.2796878159802595e-06,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11321790516376495,
"step": 3875,
"valid_targets_mean": 3432.7,
"valid_targets_min": 1321
},
{
"epoch": 6.288492706645057,
"grad_norm": 0.4951825756797347,
"learning_rate": 1.2513943881170754e-06,
"loss": 0.145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17373144626617432,
"step": 3880,
"valid_targets_mean": 3927.1,
"valid_targets_min": 1325
},
{
"epoch": 6.296596434359805,
"grad_norm": 0.4155816592498077,
"learning_rate": 1.2234071418306903e-06,
"loss": 0.1309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12273648381233215,
"step": 3885,
"valid_targets_mean": 4243.1,
"valid_targets_min": 1539
},
{
"epoch": 6.304700162074554,
"grad_norm": 0.48766069627915243,
"learning_rate": 1.1957265341779855e-06,
"loss": 0.1368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14697131514549255,
"step": 3890,
"valid_targets_mean": 4181.6,
"valid_targets_min": 1177
},
{
"epoch": 6.312803889789303,
"grad_norm": 0.3938083092461327,
"learning_rate": 1.1683530172081592e-06,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12041988968849182,
"step": 3895,
"valid_targets_mean": 5296.3,
"valid_targets_min": 1306
},
{
"epoch": 6.3209076175040515,
"grad_norm": 0.47593597010364025,
"learning_rate": 1.1412870379553387e-06,
"loss": 0.16,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16000404953956604,
"step": 3900,
"valid_targets_mean": 4644.2,
"valid_targets_min": 1309
},
{
"epoch": 6.329011345218801,
"grad_norm": 0.3902721038762542,
"learning_rate": 1.1145290384312846e-06,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14155729115009308,
"step": 3905,
"valid_targets_mean": 5272.6,
"valid_targets_min": 1362
},
{
"epoch": 6.33711507293355,
"grad_norm": 0.4251038760068053,
"learning_rate": 1.0880794556181762e-06,
"loss": 0.1526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15772640705108643,
"step": 3910,
"valid_targets_mean": 4669.5,
"valid_targets_min": 1422
},
{
"epoch": 6.345218800648298,
"grad_norm": 0.40120884770549975,
"learning_rate": 1.0619387214614662e-06,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11130170524120331,
"step": 3915,
"valid_targets_mean": 4427.3,
"valid_targets_min": 1465
},
{
"epoch": 6.353322528363047,
"grad_norm": 0.4546439264922523,
"learning_rate": 1.0361072628628354e-06,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18124914169311523,
"step": 3920,
"valid_targets_mean": 4763.3,
"valid_targets_min": 1333
},
{
"epoch": 6.361426256077796,
"grad_norm": 0.3865469165310739,
"learning_rate": 1.0105855016732113e-06,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440453827381134,
"step": 3925,
"valid_targets_mean": 5420.2,
"valid_targets_min": 1412
},
{
"epoch": 6.369529983792544,
"grad_norm": 0.46212783046959593,
"learning_rate": 9.853738546858893e-07,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12405751645565033,
"step": 3930,
"valid_targets_mean": 3459.2,
"valid_targets_min": 1270
},
{
"epoch": 6.377633711507293,
"grad_norm": 0.45293906022023217,
"learning_rate": 9.604727336297203e-07,
"loss": 0.1312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1338280439376831,
"step": 3935,
"valid_targets_mean": 3815.8,
"valid_targets_min": 1333
},
{
"epoch": 6.3857374392220425,
"grad_norm": 0.4762642698396675,
"learning_rate": 9.358825451623832e-07,
"loss": 0.1389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14254039525985718,
"step": 3940,
"valid_targets_mean": 4435.0,
"valid_targets_min": 1307
},
{
"epoch": 6.393841166936791,
"grad_norm": 0.40993514188015256,
"learning_rate": 9.116036908637582e-07,
"loss": 0.1429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13208088278770447,
"step": 3945,
"valid_targets_mean": 4901.5,
"valid_targets_min": 2394
},
{
"epoch": 6.40194489465154,
"grad_norm": 0.4050004148081513,
"learning_rate": 8.876365672293441e-07,
"loss": 0.139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10800512880086899,
"step": 3950,
"valid_targets_mean": 4286.4,
"valid_targets_min": 1533
},
{
"epoch": 6.410048622366288,
"grad_norm": 0.4372028368161644,
"learning_rate": 8.639815656638162e-07,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14087510108947754,
"step": 3955,
"valid_targets_mean": 4526.8,
"valid_targets_min": 1287
},
{
"epoch": 6.418152350081037,
"grad_norm": 0.41474637266063613,
"learning_rate": 8.406390724745961e-07,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17648552358150482,
"step": 3960,
"valid_targets_mean": 6034.9,
"valid_targets_min": 1347
},
{
"epoch": 6.426256077795786,
"grad_norm": 0.4048155564619817,
"learning_rate": 8.176094688655789e-07,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17440642416477203,
"step": 3965,
"valid_targets_mean": 5610.4,
"valid_targets_min": 1310
},
{
"epoch": 6.434359805510534,
"grad_norm": 0.4228276820400858,
"learning_rate": 7.948931309308872e-07,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14183327555656433,
"step": 3970,
"valid_targets_mean": 4442.7,
"valid_targets_min": 1396
},
{
"epoch": 6.4424635332252835,
"grad_norm": 0.4454033902831941,
"learning_rate": 7.724904296487246e-07,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13356520235538483,
"step": 3975,
"valid_targets_mean": 4284.1,
"valid_targets_min": 1373
},
{
"epoch": 6.450567260940033,
"grad_norm": 0.48618002254936554,
"learning_rate": 7.504017308753386e-07,
"loss": 0.1365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11197055876255035,
"step": 3980,
"valid_targets_mean": 3097.4,
"valid_targets_min": 837
},
{
"epoch": 6.458670988654781,
"grad_norm": 1.1613596162903213,
"learning_rate": 7.286273953390278e-07,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13441595435142517,
"step": 3985,
"valid_targets_mean": 5556.1,
"valid_targets_min": 1350
},
{
"epoch": 6.46677471636953,
"grad_norm": 0.4049486224120147,
"learning_rate": 7.071677786342568e-07,
"loss": 0.1402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14194028079509735,
"step": 3990,
"valid_targets_mean": 5311.6,
"valid_targets_min": 1465
},
{
"epoch": 6.474878444084279,
"grad_norm": 0.400038102304834,
"learning_rate": 6.860232312158554e-07,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12901249527931213,
"step": 3995,
"valid_targets_mean": 4856.2,
"valid_targets_min": 2179
},
{
"epoch": 6.482982171799027,
"grad_norm": 0.4069486273700877,
"learning_rate": 6.651940983932737e-07,
"loss": 0.1404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12928912043571472,
"step": 4000,
"valid_targets_mean": 4616.2,
"valid_targets_min": 848
},
{
"epoch": 6.491085899513776,
"grad_norm": 0.46015930681070816,
"learning_rate": 6.44680720324975e-07,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13234779238700867,
"step": 4005,
"valid_targets_mean": 3336.2,
"valid_targets_min": 1390
},
{
"epoch": 6.4991896272285254,
"grad_norm": 0.4012511213853744,
"learning_rate": 6.244834320128501e-07,
"loss": 0.1472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15023906528949738,
"step": 4010,
"valid_targets_mean": 5269.1,
"valid_targets_min": 2527
},
{
"epoch": 6.507293354943274,
"grad_norm": 0.47744140560962556,
"learning_rate": 6.0460256329677e-07,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1656455397605896,
"step": 4015,
"valid_targets_mean": 4372.4,
"valid_targets_min": 1450
},
{
"epoch": 6.515397082658023,
"grad_norm": 0.37939181638585245,
"learning_rate": 5.850384388491814e-07,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1422882229089737,
"step": 4020,
"valid_targets_mean": 5767.8,
"valid_targets_min": 2245
},
{
"epoch": 6.523500810372772,
"grad_norm": 0.3968129940328583,
"learning_rate": 5.657913781698221e-07,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13958857953548431,
"step": 4025,
"valid_targets_mean": 5217.1,
"valid_targets_min": 2293
},
{
"epoch": 6.53160453808752,
"grad_norm": 0.45533894363588545,
"learning_rate": 5.468616955804873e-07,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1408911496400833,
"step": 4030,
"valid_targets_mean": 4240.6,
"valid_targets_min": 1458
},
{
"epoch": 6.539708265802269,
"grad_norm": 0.41456973084927484,
"learning_rate": 5.282497002198983e-07,
"loss": 0.151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1309795379638672,
"step": 4035,
"valid_targets_mean": 4633.8,
"valid_targets_min": 1539
},
{
"epoch": 6.547811993517017,
"grad_norm": 0.4344790637851775,
"learning_rate": 5.099556960386686e-07,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1465933471918106,
"step": 4040,
"valid_targets_mean": 4904.2,
"valid_targets_min": 2034
},
{
"epoch": 6.5559157212317665,
"grad_norm": 0.4325462479106516,
"learning_rate": 4.919799817943238e-07,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14228688180446625,
"step": 4045,
"valid_targets_mean": 5782.6,
"valid_targets_min": 2144
},
{
"epoch": 6.564019448946516,
"grad_norm": 0.4754686884062165,
"learning_rate": 4.7432285104642703e-07,
"loss": 0.1498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16148260235786438,
"step": 4050,
"valid_targets_mean": 4153.5,
"valid_targets_min": 677
},
{
"epoch": 6.572123176661265,
"grad_norm": 0.42697061151348537,
"learning_rate": 4.569845921517968e-07,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16228759288787842,
"step": 4055,
"valid_targets_mean": 5002.3,
"valid_targets_min": 2511
},
{
"epoch": 6.580226904376013,
"grad_norm": 0.3845365808911217,
"learning_rate": 4.399654882597726e-07,
"loss": 0.1294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13468897342681885,
"step": 4060,
"valid_targets_mean": 5712.8,
"valid_targets_min": 1045
},
{
"epoch": 6.588330632090762,
"grad_norm": 0.39716277545284767,
"learning_rate": 4.232658173076232e-07,
"loss": 0.1347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14139370620250702,
"step": 4065,
"valid_targets_mean": 5950.2,
"valid_targets_min": 1399
},
{
"epoch": 6.59643435980551,
"grad_norm": 0.4468084595108756,
"learning_rate": 4.068858520159724e-07,
"loss": 0.1422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1694372296333313,
"step": 4070,
"valid_targets_mean": 4465.2,
"valid_targets_min": 709
},
{
"epoch": 6.604538087520259,
"grad_norm": 0.3671649079013761,
"learning_rate": 3.9082585988437617e-07,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12348531186580658,
"step": 4075,
"valid_targets_mean": 5558.6,
"valid_targets_min": 1388
},
{
"epoch": 6.612641815235008,
"grad_norm": 0.47981089308216524,
"learning_rate": 3.7508610318693684e-07,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13009825348854065,
"step": 4080,
"valid_targets_mean": 3335.6,
"valid_targets_min": 1376
},
{
"epoch": 6.620745542949757,
"grad_norm": 0.47241227108780176,
"learning_rate": 3.596668389680247e-07,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15220530331134796,
"step": 4085,
"valid_targets_mean": 3802.2,
"valid_targets_min": 2348
},
{
"epoch": 6.628849270664506,
"grad_norm": 0.4556695876426719,
"learning_rate": 3.445683190380833e-07,
"loss": 0.1361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12755940854549408,
"step": 4090,
"valid_targets_mean": 3677.8,
"valid_targets_min": 1393
},
{
"epoch": 6.636952998379255,
"grad_norm": 0.441358097986932,
"learning_rate": 3.297907899695019e-07,
"loss": 0.1405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13846738636493683,
"step": 4095,
"valid_targets_mean": 4536.4,
"valid_targets_min": 1451
},
{
"epoch": 6.645056726094003,
"grad_norm": 0.48127456616667247,
"learning_rate": 3.1533449309262056e-07,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1750427931547165,
"step": 4100,
"valid_targets_mean": 4037.1,
"valid_targets_min": 1341
},
{
"epoch": 6.653160453808752,
"grad_norm": 0.46639173362247416,
"learning_rate": 3.0119966449174474e-07,
"loss": 0.1275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15236026048660278,
"step": 4105,
"valid_targets_mean": 3952.3,
"valid_targets_min": 1369
},
{
"epoch": 6.661264181523501,
"grad_norm": 0.47615735862720293,
"learning_rate": 2.8738653500133494e-07,
"loss": 0.1412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13197392225265503,
"step": 4110,
"valid_targets_mean": 3993.2,
"valid_targets_min": 1323
},
{
"epoch": 6.669367909238249,
"grad_norm": 0.45472799651735124,
"learning_rate": 2.738953302022096e-07,
"loss": 0.1363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.120602548122406,
"step": 4115,
"valid_targets_mean": 3635.4,
"valid_targets_min": 1392
},
{
"epoch": 6.6774716369529985,
"grad_norm": 0.4188546649594025,
"learning_rate": 2.6072627041785925e-07,
"loss": 0.1563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13288158178329468,
"step": 4120,
"valid_targets_mean": 4825.9,
"valid_targets_min": 2039
},
{
"epoch": 6.685575364667747,
"grad_norm": 0.4639950948551984,
"learning_rate": 2.478795707108672e-07,
"loss": 0.1558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1535397320985794,
"step": 4125,
"valid_targets_mean": 4686.6,
"valid_targets_min": 1323
},
{
"epoch": 6.693679092382496,
"grad_norm": 0.41109808884224275,
"learning_rate": 2.3535544087938345e-07,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1529480516910553,
"step": 4130,
"valid_targets_mean": 5588.4,
"valid_targets_min": 2517
},
{
"epoch": 6.701782820097245,
"grad_norm": 0.45926411106835413,
"learning_rate": 2.2315408545370288e-07,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1341223120689392,
"step": 4135,
"valid_targets_mean": 4781.3,
"valid_targets_min": 1876
},
{
"epoch": 6.709886547811994,
"grad_norm": 0.395000259046136,
"learning_rate": 2.1127570369292361e-07,
"loss": 0.1298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14368417859077454,
"step": 4140,
"valid_targets_mean": 5097.6,
"valid_targets_min": 613
},
{
"epoch": 6.717990275526742,
"grad_norm": 0.46210837076522737,
"learning_rate": 1.9972048958168954e-07,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18180908262729645,
"step": 4145,
"valid_targets_mean": 4240.0,
"valid_targets_min": 1223
},
{
"epoch": 6.726094003241491,
"grad_norm": 0.432229949832389,
"learning_rate": 1.8848863182703513e-07,
"loss": 0.1402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1526516079902649,
"step": 4150,
"valid_targets_mean": 5149.5,
"valid_targets_min": 1471
},
{
"epoch": 6.7341977309562395,
"grad_norm": 0.44808799433401697,
"learning_rate": 1.7758031385528784e-07,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15459507703781128,
"step": 4155,
"valid_targets_mean": 4488.3,
"valid_targets_min": 1343
},
{
"epoch": 6.742301458670989,
"grad_norm": 0.44004554566563986,
"learning_rate": 1.6699571380908385e-07,
"loss": 0.1415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15247702598571777,
"step": 4160,
"valid_targets_mean": 4497.5,
"valid_targets_min": 1401
},
{
"epoch": 6.750405186385738,
"grad_norm": 0.43890356060699703,
"learning_rate": 1.5673500454445046e-07,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1325896680355072,
"step": 4165,
"valid_targets_mean": 4162.1,
"valid_targets_min": 1421
},
{
"epoch": 6.758508914100486,
"grad_norm": 0.39932933043091573,
"learning_rate": 1.4679835362799266e-07,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13079729676246643,
"step": 4170,
"valid_targets_mean": 5510.4,
"valid_targets_min": 1409
},
{
"epoch": 6.766612641815235,
"grad_norm": 0.46941869643754247,
"learning_rate": 1.3718592333414881e-07,
"loss": 0.1393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13742662966251373,
"step": 4175,
"valid_targets_mean": 3786.2,
"valid_targets_min": 1376
},
{
"epoch": 6.774716369529984,
"grad_norm": 0.39299371447081305,
"learning_rate": 1.2789787064253934e-07,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12248679995536804,
"step": 4180,
"valid_targets_mean": 4901.8,
"valid_targets_min": 1500
},
{
"epoch": 6.782820097244732,
"grad_norm": 0.43082508409324244,
"learning_rate": 1.1893434723541542e-07,
"loss": 0.1413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12439413368701935,
"step": 4185,
"valid_targets_mean": 3693.9,
"valid_targets_min": 1382
},
{
"epoch": 6.790923824959481,
"grad_norm": 0.4358507033661266,
"learning_rate": 1.1029549949516549e-07,
"loss": 0.1427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15898624062538147,
"step": 4190,
"valid_targets_mean": 4447.9,
"valid_targets_min": 372
},
{
"epoch": 6.7990275526742305,
"grad_norm": 0.4554334548925996,
"learning_rate": 1.0198146850193935e-07,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13918620347976685,
"step": 4195,
"valid_targets_mean": 4084.8,
"valid_targets_min": 1247
},
{
"epoch": 6.807131280388979,
"grad_norm": 0.450900839717058,
"learning_rate": 9.399239003132999e-08,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14567112922668457,
"step": 4200,
"valid_targets_mean": 4257.7,
"valid_targets_min": 971
},
{
"epoch": 6.815235008103728,
"grad_norm": 0.44464926461952875,
"learning_rate": 8.632839455216869e-08,
"loss": 0.1331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11365213990211487,
"step": 4205,
"valid_targets_mean": 3640.5,
"valid_targets_min": 1265
},
{
"epoch": 6.823338735818476,
"grad_norm": 0.4297413425159312,
"learning_rate": 7.89896072243912e-08,
"loss": 0.1449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17040380835533142,
"step": 4210,
"valid_targets_mean": 5029.8,
"valid_targets_min": 1465
},
{
"epoch": 6.831442463533225,
"grad_norm": 0.4265378172405877,
"learning_rate": 7.197614789698604e-08,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628272831439972,
"step": 4215,
"valid_targets_mean": 4827.1,
"valid_targets_min": 2268
},
{
"epoch": 6.839546191247974,
"grad_norm": 0.42738757709554764,
"learning_rate": 6.528813110604714e-08,
"loss": 0.1347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12047109007835388,
"step": 4220,
"valid_targets_mean": 4246.8,
"valid_targets_min": 688
},
{
"epoch": 6.847649918962723,
"grad_norm": 0.5091043582800635,
"learning_rate": 5.8925666072899845e-08,
"loss": 0.1364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1382569521665573,
"step": 4225,
"valid_targets_mean": 3183.8,
"valid_targets_min": 1433
},
{
"epoch": 6.855753646677472,
"grad_norm": 0.4138282308157216,
"learning_rate": 5.288885670231336e-08,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13277751207351685,
"step": 4230,
"valid_targets_mean": 5006.8,
"valid_targets_min": 1974
},
{
"epoch": 6.863857374392221,
"grad_norm": 0.4523192662938565,
"learning_rate": 4.717780158080887e-08,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11566020548343658,
"step": 4235,
"valid_targets_mean": 3727.6,
"valid_targets_min": 1486
},
{
"epoch": 6.871961102106969,
"grad_norm": 0.37548392402675607,
"learning_rate": 4.1792593975049644e-08,
"loss": 0.1369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13377472758293152,
"step": 4240,
"valid_targets_mean": 5953.8,
"valid_targets_min": 1467
},
{
"epoch": 6.880064829821718,
"grad_norm": 0.47007523708634125,
"learning_rate": 3.6733321830315636e-08,
"loss": 0.1392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12267227470874786,
"step": 4245,
"valid_targets_mean": 3472.3,
"valid_targets_min": 2085
},
{
"epoch": 6.888168557536467,
"grad_norm": 0.42709079057303595,
"learning_rate": 3.200006776906461e-08,
"loss": 0.1387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1224164217710495,
"step": 4250,
"valid_targets_mean": 3998.2,
"valid_targets_min": 2443
},
{
"epoch": 6.896272285251215,
"grad_norm": 0.39239537657898,
"learning_rate": 2.7592909089593224e-08,
"loss": 0.1405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14886951446533203,
"step": 4255,
"valid_targets_mean": 5280.1,
"valid_targets_min": 2546
},
{
"epoch": 6.904376012965964,
"grad_norm": 0.3539601345126062,
"learning_rate": 2.351191776475581e-08,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12216240912675858,
"step": 4260,
"valid_targets_mean": 5626.0,
"valid_targets_min": 678
},
{
"epoch": 6.9124797406807135,
"grad_norm": 0.42164253650702077,
"learning_rate": 1.9757160440814217e-08,
"loss": 0.1479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13502494990825653,
"step": 4265,
"valid_targets_mean": 4376.6,
"valid_targets_min": 1339
},
{
"epoch": 6.920583468395462,
"grad_norm": 0.4705700973117692,
"learning_rate": 1.6328698436327562e-08,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14658623933792114,
"step": 4270,
"valid_targets_mean": 3737.1,
"valid_targets_min": 1351
},
{
"epoch": 6.928687196110211,
"grad_norm": 0.41064747368250465,
"learning_rate": 1.3226587741159702e-08,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13569799065589905,
"step": 4275,
"valid_targets_mean": 4845.8,
"valid_targets_min": 1316
},
{
"epoch": 6.93679092382496,
"grad_norm": 0.42620733839378133,
"learning_rate": 1.0450879015566629e-08,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1472766101360321,
"step": 4280,
"valid_targets_mean": 4720.4,
"valid_targets_min": 1342
},
{
"epoch": 6.944894651539708,
"grad_norm": 0.42942547760976824,
"learning_rate": 8.001617589368238e-09,
"loss": 0.1559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17669114470481873,
"step": 4285,
"valid_targets_mean": 4890.8,
"valid_targets_min": 546
},
{
"epoch": 6.952998379254457,
"grad_norm": 0.4720547278800281,
"learning_rate": 5.878843461200046e-09,
"loss": 0.1446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13602668046951294,
"step": 4290,
"valid_targets_mean": 3606.6,
"valid_targets_min": 1438
},
{
"epoch": 6.961102106969205,
"grad_norm": 0.4338336156998582,
"learning_rate": 4.082591297873695e-09,
"loss": 0.1385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18032628297805786,
"step": 4295,
"valid_targets_mean": 4971.6,
"valid_targets_min": 2500
},
{
"epoch": 6.9692058346839545,
"grad_norm": 0.41141829681237335,
"learning_rate": 2.6128904338018624e-09,
"loss": 0.1356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1081404983997345,
"step": 4300,
"valid_targets_mean": 4556.7,
"valid_targets_min": 970
},
{
"epoch": 6.977309562398704,
"grad_norm": 0.4549661229722178,
"learning_rate": 1.4697648705186417e-09,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15801507234573364,
"step": 4305,
"valid_targets_mean": 4676.2,
"valid_targets_min": 1281
},
{
"epoch": 6.985413290113452,
"grad_norm": 0.43854485734031307,
"learning_rate": 6.532332762931859e-10,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.122274249792099,
"step": 4310,
"valid_targets_mean": 3756.2,
"valid_targets_min": 1417
},
{
"epoch": 6.993517017828201,
"grad_norm": 0.5007277079923921,
"learning_rate": 1.6330898581884414e-10,
"loss": 0.1389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1444101631641388,
"step": 4315,
"valid_targets_mean": 3494.4,
"valid_targets_min": 587
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12458416819572449,
"step": 4319,
"total_flos": 1278251302125568.0,
"train_loss": 0.1840376865397341,
"train_runtime": 22883.9619,
"train_samples_per_second": 3.016,
"train_steps_per_second": 0.189,
"valid_targets_mean": 4142.8,
"valid_targets_min": 1361
}
],
"logging_steps": 5,
"max_steps": 4319,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1278251302125568.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}