Files
nemosci-tasrep-a1mfc-dev1-m…/trainer_state.json

8045 lines
224 KiB
JSON
Raw Normal View History

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 5.0,
"eval_steps": 500,
"global_step": 3635,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.006883891693437357,
"grad_norm": 13.694241855634743,
"learning_rate": 4.395604395604396e-07,
"loss": 0.9672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3309265673160553,
"step": 5,
"valid_targets_mean": 8170.6,
"valid_targets_min": 3077
},
{
"epoch": 0.013767783386874713,
"grad_norm": 12.578564323146997,
"learning_rate": 9.890109890109891e-07,
"loss": 0.9668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30831611156463623,
"step": 10,
"valid_targets_mean": 6980.7,
"valid_targets_min": 2298
},
{
"epoch": 0.02065167508031207,
"grad_norm": 7.7944206304684025,
"learning_rate": 1.5384615384615387e-06,
"loss": 0.9211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2686140537261963,
"step": 15,
"valid_targets_mean": 6148.2,
"valid_targets_min": 2167
},
{
"epoch": 0.027535566773749427,
"grad_norm": 3.7615150954296,
"learning_rate": 2.0879120879120883e-06,
"loss": 0.8559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2865496277809143,
"step": 20,
"valid_targets_mean": 7165.8,
"valid_targets_min": 2278
},
{
"epoch": 0.03441945846718678,
"grad_norm": 1.9967996468850564,
"learning_rate": 2.6373626373626375e-06,
"loss": 0.7873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2609645128250122,
"step": 25,
"valid_targets_mean": 7202.3,
"valid_targets_min": 2907
},
{
"epoch": 0.04130335016062414,
"grad_norm": 1.642494044026072,
"learning_rate": 3.1868131868131867e-06,
"loss": 0.7615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2548447251319885,
"step": 30,
"valid_targets_mean": 7477.5,
"valid_targets_min": 2714
},
{
"epoch": 0.048187241854061494,
"grad_norm": 1.1331298421000486,
"learning_rate": 3.7362637362637367e-06,
"loss": 0.7274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24324637651443481,
"step": 35,
"valid_targets_mean": 7314.0,
"valid_targets_min": 2883
},
{
"epoch": 0.05507113354749885,
"grad_norm": 0.8610066611189371,
"learning_rate": 4.2857142857142855e-06,
"loss": 0.6803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21853984892368317,
"step": 40,
"valid_targets_mean": 7126.6,
"valid_targets_min": 2597
},
{
"epoch": 0.06195502524093621,
"grad_norm": 0.6199513616997635,
"learning_rate": 4.8351648351648355e-06,
"loss": 0.6548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20629478991031647,
"step": 45,
"valid_targets_mean": 7369.8,
"valid_targets_min": 3375
},
{
"epoch": 0.06883891693437356,
"grad_norm": 0.5292903199674134,
"learning_rate": 5.384615384615385e-06,
"loss": 0.6199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19665127992630005,
"step": 50,
"valid_targets_mean": 7356.4,
"valid_targets_min": 2005
},
{
"epoch": 0.07572280862781092,
"grad_norm": 0.43990945332342174,
"learning_rate": 5.934065934065935e-06,
"loss": 0.5721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17901910841464996,
"step": 55,
"valid_targets_mean": 8719.0,
"valid_targets_min": 589
},
{
"epoch": 0.08260670032124828,
"grad_norm": 0.34345855694621463,
"learning_rate": 6.483516483516485e-06,
"loss": 0.5352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18726885318756104,
"step": 60,
"valid_targets_mean": 9029.5,
"valid_targets_min": 4655
},
{
"epoch": 0.08949059201468564,
"grad_norm": 0.2745587801279678,
"learning_rate": 7.032967032967034e-06,
"loss": 0.509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17130973935127258,
"step": 65,
"valid_targets_mean": 10019.8,
"valid_targets_min": 4996
},
{
"epoch": 0.09637448370812299,
"grad_norm": 0.24899014086502314,
"learning_rate": 7.582417582417583e-06,
"loss": 0.4905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16219963133335114,
"step": 70,
"valid_targets_mean": 9413.2,
"valid_targets_min": 3337
},
{
"epoch": 0.10325837540156035,
"grad_norm": 0.6632172104478877,
"learning_rate": 8.131868131868132e-06,
"loss": 0.4843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16867445409297943,
"step": 75,
"valid_targets_mean": 10127.1,
"valid_targets_min": 3360
},
{
"epoch": 0.1101422670949977,
"grad_norm": 0.22112536714345443,
"learning_rate": 8.681318681318681e-06,
"loss": 0.4647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16406437754631042,
"step": 80,
"valid_targets_mean": 9319.1,
"valid_targets_min": 685
},
{
"epoch": 0.11702615878843506,
"grad_norm": 0.23254063354964463,
"learning_rate": 9.230769230769232e-06,
"loss": 0.4668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15404294431209564,
"step": 85,
"valid_targets_mean": 9109.9,
"valid_targets_min": 4379
},
{
"epoch": 0.12391005048187242,
"grad_norm": 0.2289262735187177,
"learning_rate": 9.780219780219781e-06,
"loss": 0.4513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14573627710342407,
"step": 90,
"valid_targets_mean": 9313.2,
"valid_targets_min": 3452
},
{
"epoch": 0.13079394217530976,
"grad_norm": 0.2069573644523245,
"learning_rate": 1.0329670329670332e-05,
"loss": 0.444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14479273557662964,
"step": 95,
"valid_targets_mean": 8640.9,
"valid_targets_min": 383
},
{
"epoch": 0.13767783386874713,
"grad_norm": 0.2358199789841859,
"learning_rate": 1.087912087912088e-05,
"loss": 0.4416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14525240659713745,
"step": 100,
"valid_targets_mean": 9029.9,
"valid_targets_min": 4552
},
{
"epoch": 0.1445617255621845,
"grad_norm": 0.21577235061513939,
"learning_rate": 1.1428571428571429e-05,
"loss": 0.4334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14647001028060913,
"step": 105,
"valid_targets_mean": 10390.2,
"valid_targets_min": 4833
},
{
"epoch": 0.15144561725562183,
"grad_norm": 0.23169177022891713,
"learning_rate": 1.1978021978021978e-05,
"loss": 0.424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14595040678977966,
"step": 110,
"valid_targets_mean": 9771.6,
"valid_targets_min": 3641
},
{
"epoch": 0.1583295089490592,
"grad_norm": 0.23315620907648432,
"learning_rate": 1.2527472527472529e-05,
"loss": 0.4219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13074077665805817,
"step": 115,
"valid_targets_mean": 9316.0,
"valid_targets_min": 1929
},
{
"epoch": 0.16521340064249657,
"grad_norm": 0.23578755278571784,
"learning_rate": 1.3076923076923078e-05,
"loss": 0.422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14109788835048676,
"step": 120,
"valid_targets_mean": 9838.7,
"valid_targets_min": 4324
},
{
"epoch": 0.1720972923359339,
"grad_norm": 0.244154827729474,
"learning_rate": 1.3626373626373627e-05,
"loss": 0.4272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14524628221988678,
"step": 125,
"valid_targets_mean": 9693.1,
"valid_targets_min": 3811
},
{
"epoch": 0.17898118402937127,
"grad_norm": 0.2089268624041823,
"learning_rate": 1.4175824175824178e-05,
"loss": 0.4122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12458304315805435,
"step": 130,
"valid_targets_mean": 9686.9,
"valid_targets_min": 3338
},
{
"epoch": 0.18586507572280864,
"grad_norm": 0.2328880543137963,
"learning_rate": 1.4725274725274727e-05,
"loss": 0.4021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12566791474819183,
"step": 135,
"valid_targets_mean": 9590.6,
"valid_targets_min": 4785
},
{
"epoch": 0.19274896741624598,
"grad_norm": 0.22383231353766703,
"learning_rate": 1.5274725274725277e-05,
"loss": 0.4044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14299173653125763,
"step": 140,
"valid_targets_mean": 10718.9,
"valid_targets_min": 4892
},
{
"epoch": 0.19963285910968334,
"grad_norm": 0.2464207171177229,
"learning_rate": 1.5824175824175826e-05,
"loss": 0.4077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1544559895992279,
"step": 145,
"valid_targets_mean": 10753.2,
"valid_targets_min": 3836
},
{
"epoch": 0.2065167508031207,
"grad_norm": 0.22729169591824225,
"learning_rate": 1.6373626373626375e-05,
"loss": 0.4011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11852603405714035,
"step": 150,
"valid_targets_mean": 8877.9,
"valid_targets_min": 424
},
{
"epoch": 0.21340064249655805,
"grad_norm": 0.22989523354603325,
"learning_rate": 1.6923076923076924e-05,
"loss": 0.4017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1433342844247818,
"step": 155,
"valid_targets_mean": 11518.0,
"valid_targets_min": 4504
},
{
"epoch": 0.2202845341899954,
"grad_norm": 0.2669020061521446,
"learning_rate": 1.7472527472527473e-05,
"loss": 0.3994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14459729194641113,
"step": 160,
"valid_targets_mean": 10316.1,
"valid_targets_min": 4842
},
{
"epoch": 0.22716842588343278,
"grad_norm": 0.23145661525974606,
"learning_rate": 1.8021978021978023e-05,
"loss": 0.3972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13346941769123077,
"step": 165,
"valid_targets_mean": 10630.5,
"valid_targets_min": 5085
},
{
"epoch": 0.23405231757687012,
"grad_norm": 0.23112572970307219,
"learning_rate": 1.8571428571428575e-05,
"loss": 0.3939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14197933673858643,
"step": 170,
"valid_targets_mean": 10322.6,
"valid_targets_min": 4928
},
{
"epoch": 0.24093620927030748,
"grad_norm": 0.2707224338675443,
"learning_rate": 1.9120879120879124e-05,
"loss": 0.3896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13661183416843414,
"step": 175,
"valid_targets_mean": 10297.2,
"valid_targets_min": 3888
},
{
"epoch": 0.24782010096374485,
"grad_norm": 0.2622838211701269,
"learning_rate": 1.967032967032967e-05,
"loss": 0.3882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12619677186012268,
"step": 180,
"valid_targets_mean": 8726.7,
"valid_targets_min": 265
},
{
"epoch": 0.2547039926571822,
"grad_norm": 0.3018730334828126,
"learning_rate": 2.021978021978022e-05,
"loss": 0.3827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11439290642738342,
"step": 185,
"valid_targets_mean": 8473.2,
"valid_targets_min": 3703
},
{
"epoch": 0.2615878843506195,
"grad_norm": 0.27854199506530175,
"learning_rate": 2.0769230769230772e-05,
"loss": 0.3852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1296503096818924,
"step": 190,
"valid_targets_mean": 10562.8,
"valid_targets_min": 4059
},
{
"epoch": 0.2684717760440569,
"grad_norm": 0.32965118396403853,
"learning_rate": 2.131868131868132e-05,
"loss": 0.4062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13311529159545898,
"step": 195,
"valid_targets_mean": 5732.4,
"valid_targets_min": 996
},
{
"epoch": 0.27535566773749426,
"grad_norm": 0.34563256253130675,
"learning_rate": 2.1868131868131867e-05,
"loss": 0.4219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13766756653785706,
"step": 200,
"valid_targets_mean": 5909.7,
"valid_targets_min": 322
},
{
"epoch": 0.2822395594309316,
"grad_norm": 3.800335015027523,
"learning_rate": 2.241758241758242e-05,
"loss": 0.6701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3517041504383087,
"step": 205,
"valid_targets_mean": 3622.3,
"valid_targets_min": 1417
},
{
"epoch": 0.289123451124369,
"grad_norm": 1.2361781661013793,
"learning_rate": 2.296703296703297e-05,
"loss": 0.9022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3068923056125641,
"step": 210,
"valid_targets_mean": 4234.8,
"valid_targets_min": 1229
},
{
"epoch": 0.29600734281780633,
"grad_norm": 0.5360103186756147,
"learning_rate": 2.3516483516483518e-05,
"loss": 0.7856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1845906674861908,
"step": 215,
"valid_targets_mean": 3496.8,
"valid_targets_min": 792
},
{
"epoch": 0.30289123451124367,
"grad_norm": 0.4462165113821834,
"learning_rate": 2.4065934065934067e-05,
"loss": 0.8366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27402248978614807,
"step": 220,
"valid_targets_mean": 4790.7,
"valid_targets_min": 1423
},
{
"epoch": 0.30977512620468106,
"grad_norm": 0.4075124579712277,
"learning_rate": 2.461538461538462e-05,
"loss": 0.7601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29145288467407227,
"step": 225,
"valid_targets_mean": 4529.3,
"valid_targets_min": 1236
},
{
"epoch": 0.3166590178981184,
"grad_norm": 0.37093297756645077,
"learning_rate": 2.5164835164835165e-05,
"loss": 0.7176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21884280443191528,
"step": 230,
"valid_targets_mean": 3307.1,
"valid_targets_min": 1399
},
{
"epoch": 0.32354290959155574,
"grad_norm": 0.3496546260867017,
"learning_rate": 2.5714285714285718e-05,
"loss": 0.7248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23322607576847076,
"step": 235,
"valid_targets_mean": 4017.8,
"valid_targets_min": 1176
},
{
"epoch": 0.33042680128499313,
"grad_norm": 0.3187272125501439,
"learning_rate": 2.6263736263736267e-05,
"loss": 0.6923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14147228002548218,
"step": 240,
"valid_targets_mean": 1564.6,
"valid_targets_min": 635
},
{
"epoch": 0.33731069297843047,
"grad_norm": 0.28962426263990193,
"learning_rate": 2.6813186813186813e-05,
"loss": 0.7099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24177516996860504,
"step": 245,
"valid_targets_mean": 4694.7,
"valid_targets_min": 1910
},
{
"epoch": 0.3441945846718678,
"grad_norm": 0.35220902165497164,
"learning_rate": 2.7362637362637365e-05,
"loss": 0.6842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2731242775917053,
"step": 250,
"valid_targets_mean": 4543.5,
"valid_targets_min": 712
},
{
"epoch": 0.3510784763653052,
"grad_norm": 0.3316735178709283,
"learning_rate": 2.7912087912087915e-05,
"loss": 0.6671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2385597825050354,
"step": 255,
"valid_targets_mean": 3509.4,
"valid_targets_min": 1442
},
{
"epoch": 0.35796236805874254,
"grad_norm": 0.30655273710875297,
"learning_rate": 2.8461538461538464e-05,
"loss": 0.6768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1650443971157074,
"step": 260,
"valid_targets_mean": 3599.4,
"valid_targets_min": 328
},
{
"epoch": 0.3648462597521799,
"grad_norm": 0.34083054525967005,
"learning_rate": 2.9010989010989013e-05,
"loss": 0.639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11122392863035202,
"step": 265,
"valid_targets_mean": 980.5,
"valid_targets_min": 475
},
{
"epoch": 0.3717301514456173,
"grad_norm": 0.3124276244867637,
"learning_rate": 2.9560439560439565e-05,
"loss": 0.6749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24359172582626343,
"step": 270,
"valid_targets_mean": 4849.9,
"valid_targets_min": 1243
},
{
"epoch": 0.3786140431390546,
"grad_norm": 0.3181564926526228,
"learning_rate": 3.010989010989011e-05,
"loss": 0.6522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2207922339439392,
"step": 275,
"valid_targets_mean": 4380.0,
"valid_targets_min": 1142
},
{
"epoch": 0.38549793483249195,
"grad_norm": 0.37007524888913634,
"learning_rate": 3.065934065934067e-05,
"loss": 0.6879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25520047545433044,
"step": 280,
"valid_targets_mean": 3904.7,
"valid_targets_min": 1187
},
{
"epoch": 0.39238182652592934,
"grad_norm": 0.30196455505898595,
"learning_rate": 3.120879120879121e-05,
"loss": 0.6619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1992959976196289,
"step": 285,
"valid_targets_mean": 3962.2,
"valid_targets_min": 1010
},
{
"epoch": 0.3992657182193667,
"grad_norm": 0.37081909199931196,
"learning_rate": 3.175824175824176e-05,
"loss": 0.6366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13232207298278809,
"step": 290,
"valid_targets_mean": 1099.3,
"valid_targets_min": 280
},
{
"epoch": 0.406149609912804,
"grad_norm": 0.3104836906355742,
"learning_rate": 3.230769230769231e-05,
"loss": 0.6609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24800434708595276,
"step": 295,
"valid_targets_mean": 5050.1,
"valid_targets_min": 1178
},
{
"epoch": 0.4130335016062414,
"grad_norm": 0.28643747421830573,
"learning_rate": 3.285714285714286e-05,
"loss": 0.6472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2316061109304428,
"step": 300,
"valid_targets_mean": 5151.1,
"valid_targets_min": 1346
},
{
"epoch": 0.41991739329967875,
"grad_norm": 0.32511728531116485,
"learning_rate": 3.340659340659341e-05,
"loss": 0.4525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09048983454704285,
"step": 305,
"valid_targets_mean": 5515.5,
"valid_targets_min": 1936
},
{
"epoch": 0.4268012849931161,
"grad_norm": 0.30988433634655266,
"learning_rate": 3.3956043956043956e-05,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07446835190057755,
"step": 310,
"valid_targets_mean": 5127.6,
"valid_targets_min": 2180
},
{
"epoch": 0.4336851766865535,
"grad_norm": 0.2617016938161096,
"learning_rate": 3.450549450549451e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06975876539945602,
"step": 315,
"valid_targets_mean": 5021.8,
"valid_targets_min": 2808
},
{
"epoch": 0.4405690683799908,
"grad_norm": 0.2685638299614147,
"learning_rate": 3.505494505494506e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07339228689670563,
"step": 320,
"valid_targets_mean": 5327.4,
"valid_targets_min": 2771
},
{
"epoch": 0.44745296007342816,
"grad_norm": 0.2621136266965172,
"learning_rate": 3.56043956043956e-05,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08050457388162613,
"step": 325,
"valid_targets_mean": 5568.0,
"valid_targets_min": 3219
},
{
"epoch": 0.45433685176686556,
"grad_norm": 0.28262871610816387,
"learning_rate": 3.615384615384616e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0704975575208664,
"step": 330,
"valid_targets_mean": 5279.6,
"valid_targets_min": 3339
},
{
"epoch": 0.4612207434603029,
"grad_norm": 0.23957182507594812,
"learning_rate": 3.67032967032967e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06967966258525848,
"step": 335,
"valid_targets_mean": 5462.8,
"valid_targets_min": 1825
},
{
"epoch": 0.46810463515374023,
"grad_norm": 0.2590213889061684,
"learning_rate": 3.725274725274726e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06722544878721237,
"step": 340,
"valid_targets_mean": 5447.9,
"valid_targets_min": 2456
},
{
"epoch": 0.47498852684717763,
"grad_norm": 0.2786922148808639,
"learning_rate": 3.7802197802197807e-05,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07029011845588684,
"step": 345,
"valid_targets_mean": 5365.3,
"valid_targets_min": 2902
},
{
"epoch": 0.48187241854061497,
"grad_norm": 0.24349634807812348,
"learning_rate": 3.8351648351648356e-05,
"loss": 0.1988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.063286691904068,
"step": 350,
"valid_targets_mean": 4987.0,
"valid_targets_min": 3287
},
{
"epoch": 0.4887563102340523,
"grad_norm": 0.22666899467248464,
"learning_rate": 3.8901098901098905e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05999894440174103,
"step": 355,
"valid_targets_mean": 5047.8,
"valid_targets_min": 2252
},
{
"epoch": 0.4956402019274897,
"grad_norm": 0.2326604668633739,
"learning_rate": 3.9450549450549454e-05,
"loss": 0.1993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07216238975524902,
"step": 360,
"valid_targets_mean": 5323.9,
"valid_targets_min": 2401
},
{
"epoch": 0.502524093620927,
"grad_norm": 0.23872575419905823,
"learning_rate": 4e-05,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06324415653944016,
"step": 365,
"valid_targets_mean": 5421.0,
"valid_targets_min": 916
},
{
"epoch": 0.5094079853143644,
"grad_norm": 0.24034930967082238,
"learning_rate": 3.999976939016174e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059262461960315704,
"step": 370,
"valid_targets_mean": 5157.3,
"valid_targets_min": 2787
},
{
"epoch": 0.5162918770078018,
"grad_norm": 0.2633330384697458,
"learning_rate": 3.999907756596503e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06677208840847015,
"step": 375,
"valid_targets_mean": 5285.9,
"valid_targets_min": 2725
},
{
"epoch": 0.523175768701239,
"grad_norm": 0.20733514452513443,
"learning_rate": 3.999792454336403e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06367021799087524,
"step": 380,
"valid_targets_mean": 4471.1,
"valid_targets_min": 773
},
{
"epoch": 0.5300596603946764,
"grad_norm": 0.22923343428156906,
"learning_rate": 3.999631034894857e-05,
"loss": 0.1933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06512193381786346,
"step": 385,
"valid_targets_mean": 5323.2,
"valid_targets_min": 3113
},
{
"epoch": 0.5369435520881138,
"grad_norm": 0.21779536364748414,
"learning_rate": 3.999423501994356e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06609879434108734,
"step": 390,
"valid_targets_mean": 5507.8,
"valid_targets_min": 3054
},
{
"epoch": 0.5438274437815511,
"grad_norm": 0.24992019658429662,
"learning_rate": 3.999169860420813e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06085608899593353,
"step": 395,
"valid_targets_mean": 5065.1,
"valid_targets_min": 2739
},
{
"epoch": 0.5507113354749885,
"grad_norm": 0.23256672963489214,
"learning_rate": 3.9988701160234525e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0652182325720787,
"step": 400,
"valid_targets_mean": 5267.3,
"valid_targets_min": 3285
},
{
"epoch": 0.5575952271684259,
"grad_norm": 0.20980766039558524,
"learning_rate": 3.998524275714675e-05,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06631162762641907,
"step": 405,
"valid_targets_mean": 5350.7,
"valid_targets_min": 2809
},
{
"epoch": 0.5644791188618632,
"grad_norm": 0.47517037709324333,
"learning_rate": 3.998132347469898e-05,
"loss": 0.5104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19077736139297485,
"step": 410,
"valid_targets_mean": 4092.8,
"valid_targets_min": 1262
},
{
"epoch": 0.5713630105553006,
"grad_norm": 0.33682213693847374,
"learning_rate": 3.997694340327373e-05,
"loss": 0.5536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18831773102283478,
"step": 415,
"valid_targets_mean": 3959.6,
"valid_targets_min": 922
},
{
"epoch": 0.578246902248738,
"grad_norm": 0.35226360811084995,
"learning_rate": 3.9972102643879754e-05,
"loss": 0.5528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17390920221805573,
"step": 420,
"valid_targets_mean": 3500.9,
"valid_targets_min": 1193
},
{
"epoch": 0.5851307939421753,
"grad_norm": 0.3482865590559308,
"learning_rate": 3.996680130814972e-05,
"loss": 0.5426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17027497291564941,
"step": 425,
"valid_targets_mean": 3293.8,
"valid_targets_min": 1211
},
{
"epoch": 0.5920146856356127,
"grad_norm": 0.2975124836077972,
"learning_rate": 3.996103951833766e-05,
"loss": 0.5358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1929185539484024,
"step": 430,
"valid_targets_mean": 4374.8,
"valid_targets_min": 1271
},
{
"epoch": 0.59889857732905,
"grad_norm": 0.3333015107750898,
"learning_rate": 3.995481740731609e-05,
"loss": 0.5545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15541371703147888,
"step": 435,
"valid_targets_mean": 2742.0,
"valid_targets_min": 1163
},
{
"epoch": 0.6057824690224873,
"grad_norm": 0.36064760501351867,
"learning_rate": 3.994813511857304e-05,
"loss": 0.528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17974039912223816,
"step": 440,
"valid_targets_mean": 2944.6,
"valid_targets_min": 747
},
{
"epoch": 0.6126663607159247,
"grad_norm": 0.33429331281353,
"learning_rate": 3.994099280620865e-05,
"loss": 0.4993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10126718133687973,
"step": 445,
"valid_targets_mean": 1390.7,
"valid_targets_min": 617
},
{
"epoch": 0.6195502524093621,
"grad_norm": 0.2999415809286727,
"learning_rate": 3.9933390634931674e-05,
"loss": 0.5597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20320364832878113,
"step": 450,
"valid_targets_mean": 5282.3,
"valid_targets_min": 1416
},
{
"epoch": 0.6264341441027994,
"grad_norm": 0.3059815328895148,
"learning_rate": 3.992532878005565e-05,
"loss": 0.5185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21273663640022278,
"step": 455,
"valid_targets_mean": 5102.7,
"valid_targets_min": 635
},
{
"epoch": 0.6333180357962368,
"grad_norm": 0.30974645010152174,
"learning_rate": 3.9916807427494895e-05,
"loss": 0.541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17771270871162415,
"step": 460,
"valid_targets_mean": 4471.8,
"valid_targets_min": 1166
},
{
"epoch": 0.6402019274896742,
"grad_norm": 0.3374419937482823,
"learning_rate": 3.9907826773760175e-05,
"loss": 0.5126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18608638644218445,
"step": 465,
"valid_targets_mean": 3015.3,
"valid_targets_min": 644
},
{
"epoch": 0.6470858191831115,
"grad_norm": 0.3305201729547266,
"learning_rate": 3.98983870259542e-05,
"loss": 0.5091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16256271302700043,
"step": 470,
"valid_targets_mean": 4168.5,
"valid_targets_min": 1159
},
{
"epoch": 0.6539697108765489,
"grad_norm": 0.314999512758721,
"learning_rate": 3.988848840176685e-05,
"loss": 0.5552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19044813513755798,
"step": 475,
"valid_targets_mean": 4139.7,
"valid_targets_min": 1171
},
{
"epoch": 0.6608536025699863,
"grad_norm": 0.3304218478626873,
"learning_rate": 3.987813112947013e-05,
"loss": 0.5305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1605474352836609,
"step": 480,
"valid_targets_mean": 3524.7,
"valid_targets_min": 706
},
{
"epoch": 0.6677374942634235,
"grad_norm": 0.5399772854729523,
"learning_rate": 3.986731544791293e-05,
"loss": 0.5285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13693946599960327,
"step": 485,
"valid_targets_mean": 974.1,
"valid_targets_min": 373
},
{
"epoch": 0.6746213859568609,
"grad_norm": 0.29344221922807473,
"learning_rate": 3.9856041606515514e-05,
"loss": 0.5146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15577596426010132,
"step": 490,
"valid_targets_mean": 4034.9,
"valid_targets_min": 1413
},
{
"epoch": 0.6815052776502983,
"grad_norm": 0.30625888942494645,
"learning_rate": 3.984430986526375e-05,
"loss": 0.5226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18413081765174866,
"step": 495,
"valid_targets_mean": 4597.8,
"valid_targets_min": 1386
},
{
"epoch": 0.6883891693437356,
"grad_norm": 0.35972444033240863,
"learning_rate": 3.983212049470313e-05,
"loss": 0.5065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14991965889930725,
"step": 500,
"valid_targets_mean": 3344.0,
"valid_targets_min": 1074
},
{
"epoch": 0.695273061037173,
"grad_norm": 0.2963430462822694,
"learning_rate": 3.981947377593254e-05,
"loss": 0.5326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25120216608047485,
"step": 505,
"valid_targets_mean": 4781.9,
"valid_targets_min": 1038
},
{
"epoch": 0.7021569527306104,
"grad_norm": 0.2728001352410558,
"learning_rate": 3.9806370000597745e-05,
"loss": 0.5083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14410412311553955,
"step": 510,
"valid_targets_mean": 4052.2,
"valid_targets_min": 1148
},
{
"epoch": 0.7090408444240477,
"grad_norm": 0.29626178481350945,
"learning_rate": 3.9792809470884705e-05,
"loss": 0.4415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09617213904857635,
"step": 515,
"valid_targets_mean": 5513.2,
"valid_targets_min": 260
},
{
"epoch": 0.7159247361174851,
"grad_norm": 0.28371396859472753,
"learning_rate": 3.977879249951258e-05,
"loss": 0.3555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1328997015953064,
"step": 520,
"valid_targets_mean": 6674.3,
"valid_targets_min": 667
},
{
"epoch": 0.7228086278109225,
"grad_norm": 0.260103490841822,
"learning_rate": 3.976431940972651e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11287006735801697,
"step": 525,
"valid_targets_mean": 5004.6,
"valid_targets_min": 184
},
{
"epoch": 0.7296925195043598,
"grad_norm": 0.2368718325327304,
"learning_rate": 3.974939053529019e-05,
"loss": 0.352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11172248423099518,
"step": 530,
"valid_targets_mean": 6059.3,
"valid_targets_min": 496
},
{
"epoch": 0.7365764111977972,
"grad_norm": 0.2320176040482457,
"learning_rate": 3.9734006220478156e-05,
"loss": 0.3474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055815745145082474,
"step": 535,
"valid_targets_mean": 1604.8,
"valid_targets_min": 520
},
{
"epoch": 0.7434603028912345,
"grad_norm": 0.23911921052474808,
"learning_rate": 3.971816682006783e-05,
"loss": 0.3444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09215737134218216,
"step": 540,
"valid_targets_mean": 6672.8,
"valid_targets_min": 750
},
{
"epoch": 0.7503441945846718,
"grad_norm": 0.23373511921257778,
"learning_rate": 3.9701872699331384e-05,
"loss": 0.3257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10297545790672302,
"step": 545,
"valid_targets_mean": 5849.8,
"valid_targets_min": 225
},
{
"epoch": 0.7572280862781092,
"grad_norm": 0.2224554796838409,
"learning_rate": 3.9685124234027264e-05,
"loss": 0.3309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11439158767461777,
"step": 550,
"valid_targets_mean": 6783.3,
"valid_targets_min": 643
},
{
"epoch": 0.7641119779715466,
"grad_norm": 0.20688218598394778,
"learning_rate": 3.966792181039156e-05,
"loss": 0.3208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09738504886627197,
"step": 555,
"valid_targets_mean": 6440.8,
"valid_targets_min": 392
},
{
"epoch": 0.7709958696649839,
"grad_norm": 0.2515540099960665,
"learning_rate": 3.965026582512908e-05,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17061451077461243,
"step": 560,
"valid_targets_mean": 8714.9,
"valid_targets_min": 1646
},
{
"epoch": 0.7778797613584213,
"grad_norm": 0.24202712344703942,
"learning_rate": 3.963215668540423e-05,
"loss": 0.3186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08065859973430634,
"step": 565,
"valid_targets_mean": 6242.6,
"valid_targets_min": 1338
},
{
"epoch": 0.7847636530518587,
"grad_norm": 0.20728694668286363,
"learning_rate": 3.9613594808831565e-05,
"loss": 0.324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1332765817642212,
"step": 570,
"valid_targets_mean": 7600.2,
"valid_targets_min": 399
},
{
"epoch": 0.791647544745296,
"grad_norm": 0.22011068416498333,
"learning_rate": 3.959458062346624e-05,
"loss": 0.3403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07994946092367172,
"step": 575,
"valid_targets_mean": 6031.7,
"valid_targets_min": 993
},
{
"epoch": 0.7985314364387334,
"grad_norm": 0.20100710625863627,
"learning_rate": 3.957511456779407e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09593126177787781,
"step": 580,
"valid_targets_mean": 6480.3,
"valid_targets_min": 279
},
{
"epoch": 0.8054153281321708,
"grad_norm": 0.204267562824806,
"learning_rate": 3.9555197090721446e-05,
"loss": 0.3282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08679480850696564,
"step": 585,
"valid_targets_mean": 6095.1,
"valid_targets_min": 1420
},
{
"epoch": 0.812299219825608,
"grad_norm": 0.20762239543542987,
"learning_rate": 3.9534828651564987e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09902271628379822,
"step": 590,
"valid_targets_mean": 6487.8,
"valid_targets_min": 491
},
{
"epoch": 0.8191831115190454,
"grad_norm": 0.24753637813892274,
"learning_rate": 3.951400972004094e-05,
"loss": 0.2981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08057793974876404,
"step": 595,
"valid_targets_mean": 1157.9,
"valid_targets_min": 493
},
{
"epoch": 0.8260670032124828,
"grad_norm": 0.21936291447133946,
"learning_rate": 3.949274077625435e-05,
"loss": 0.3133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10192103683948517,
"step": 600,
"valid_targets_mean": 6671.6,
"valid_targets_min": 354
},
{
"epoch": 0.8329508949059201,
"grad_norm": 0.22563637490059102,
"learning_rate": 3.947102231068798e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12188886851072311,
"step": 605,
"valid_targets_mean": 7020.9,
"valid_targets_min": 848
},
{
"epoch": 0.8398347865993575,
"grad_norm": 0.39524725243572917,
"learning_rate": 3.944885482419102e-05,
"loss": 0.3186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10121281445026398,
"step": 610,
"valid_targets_mean": 3855.2,
"valid_targets_min": 967
},
{
"epoch": 0.8467186782927949,
"grad_norm": 0.2991875521643564,
"learning_rate": 3.942623882796751e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10876717418432236,
"step": 615,
"valid_targets_mean": 4457.2,
"valid_targets_min": 642
},
{
"epoch": 0.8536025699862322,
"grad_norm": 0.2875325088708275,
"learning_rate": 3.940317484356459e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09426983445882797,
"step": 620,
"valid_targets_mean": 3784.5,
"valid_targets_min": 456
},
{
"epoch": 0.8604864616796696,
"grad_norm": 0.26938998781457324,
"learning_rate": 3.93796634028604e-05,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09109891951084137,
"step": 625,
"valid_targets_mean": 3845.3,
"valid_targets_min": 338
},
{
"epoch": 0.867370353373107,
"grad_norm": 0.2668306298041638,
"learning_rate": 3.935570504805192e-05,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10715287178754807,
"step": 630,
"valid_targets_mean": 4422.9,
"valid_targets_min": 1886
},
{
"epoch": 0.8742542450665443,
"grad_norm": 0.2619060097050138,
"learning_rate": 3.933130033164238e-05,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09461759775876999,
"step": 635,
"valid_targets_mean": 4114.4,
"valid_targets_min": 738
},
{
"epoch": 0.8811381367599816,
"grad_norm": 0.29246965248688367,
"learning_rate": 3.930644981642854e-05,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0922466367483139,
"step": 640,
"valid_targets_mean": 3997.7,
"valid_targets_min": 1348
},
{
"epoch": 0.888022028453419,
"grad_norm": 0.27956681063543165,
"learning_rate": 3.928115407548774e-05,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07921630144119263,
"step": 645,
"valid_targets_mean": 3248.9,
"valid_targets_min": 330
},
{
"epoch": 0.8949059201468563,
"grad_norm": 0.3100537797560849,
"learning_rate": 3.925541369216465e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09321758151054382,
"step": 650,
"valid_targets_mean": 4329.2,
"valid_targets_min": 1777
},
{
"epoch": 0.9017898118402937,
"grad_norm": 0.23952771554338054,
"learning_rate": 3.9229229260057824e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08680932223796844,
"step": 655,
"valid_targets_mean": 3712.8,
"valid_targets_min": 421
},
{
"epoch": 0.9086737035337311,
"grad_norm": 0.2475904156940587,
"learning_rate": 3.920260138300604e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07667960226535797,
"step": 660,
"valid_targets_mean": 3789.1,
"valid_targets_min": 454
},
{
"epoch": 0.9155575952271684,
"grad_norm": 0.26171304487950436,
"learning_rate": 3.917553067507433e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09974247217178345,
"step": 665,
"valid_targets_mean": 3968.0,
"valid_targets_min": 349
},
{
"epoch": 0.9224414869206058,
"grad_norm": 0.2404358549592192,
"learning_rate": 3.914801776053986e-05,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07945016771554947,
"step": 670,
"valid_targets_mean": 3647.0,
"valid_targets_min": 470
},
{
"epoch": 0.9293253786140432,
"grad_norm": 0.2460827868496975,
"learning_rate": 3.91200632738775e-05,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07959331572055817,
"step": 675,
"valid_targets_mean": 3824.6,
"valid_targets_min": 559
},
{
"epoch": 0.9362092703074805,
"grad_norm": 0.24390454380801813,
"learning_rate": 3.9091667859745225e-05,
"loss": 0.2495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08360792696475983,
"step": 680,
"valid_targets_mean": 3890.2,
"valid_targets_min": 1822
},
{
"epoch": 0.9430931620009179,
"grad_norm": 0.4337940381759169,
"learning_rate": 3.9062832172969206e-05,
"loss": 0.3283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11606889218091965,
"step": 685,
"valid_targets_mean": 7327.0,
"valid_targets_min": 1240
},
{
"epoch": 0.9499770536943553,
"grad_norm": 0.30889787404915514,
"learning_rate": 3.903355687852876e-05,
"loss": 0.3196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1101982593536377,
"step": 690,
"valid_targets_mean": 7614.4,
"valid_targets_min": 389
},
{
"epoch": 0.9568609453877925,
"grad_norm": 0.2542265522759153,
"learning_rate": 3.900384265154098e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09973853081464767,
"step": 695,
"valid_targets_mean": 7250.6,
"valid_targets_min": 2163
},
{
"epoch": 0.9637448370812299,
"grad_norm": 0.2901157227890436,
"learning_rate": 3.897369017724517e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10261671245098114,
"step": 700,
"valid_targets_mean": 6762.3,
"valid_targets_min": 541
},
{
"epoch": 0.9706287287746673,
"grad_norm": 0.25100553909772455,
"learning_rate": 3.894310015098705e-05,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11131678521633148,
"step": 705,
"valid_targets_mean": 6911.7,
"valid_targets_min": 306
},
{
"epoch": 0.9775126204681046,
"grad_norm": 0.25326241165531344,
"learning_rate": 3.8912073278202716e-05,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10062243789434433,
"step": 710,
"valid_targets_mean": 7406.8,
"valid_targets_min": 457
},
{
"epoch": 0.984396512161542,
"grad_norm": 0.24214203836987996,
"learning_rate": 3.88806102744024e-05,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09995930641889572,
"step": 715,
"valid_targets_mean": 7208.4,
"valid_targets_min": 3982
},
{
"epoch": 0.9912804038549794,
"grad_norm": 0.20629658879201448,
"learning_rate": 3.8848711865153906e-05,
"loss": 0.2667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08350709080696106,
"step": 720,
"valid_targets_mean": 6352.4,
"valid_targets_min": 410
},
{
"epoch": 0.9981642955484167,
"grad_norm": 0.22921521139927106,
"learning_rate": 3.881637878606594e-05,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09085282683372498,
"step": 725,
"valid_targets_mean": 6267.2,
"valid_targets_min": 102
},
{
"epoch": 1.0041303350160624,
"grad_norm": 1.2507481131485862,
"learning_rate": 3.878361178277111e-05,
"loss": 0.5635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2309202402830124,
"step": 730,
"valid_targets_mean": 7854.0,
"valid_targets_min": 2676
},
{
"epoch": 1.0110142267094997,
"grad_norm": 0.7360689628527337,
"learning_rate": 3.875041161090875e-05,
"loss": 0.564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16059252619743347,
"step": 735,
"valid_targets_mean": 6740.2,
"valid_targets_min": 3017
},
{
"epoch": 1.0178981184029372,
"grad_norm": 0.49931300255816746,
"learning_rate": 3.8716779036107494e-05,
"loss": 0.5041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1491689383983612,
"step": 740,
"valid_targets_mean": 7294.2,
"valid_targets_min": 3200
},
{
"epoch": 1.0247820100963745,
"grad_norm": 0.3505316965796473,
"learning_rate": 3.8682714833967606e-05,
"loss": 0.4711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16744652390480042,
"step": 745,
"valid_targets_mean": 7212.2,
"valid_targets_min": 2554
},
{
"epoch": 1.0316659017898118,
"grad_norm": 0.29590178804551,
"learning_rate": 3.8648219790043086e-05,
"loss": 0.4479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15151597559452057,
"step": 750,
"valid_targets_mean": 7016.0,
"valid_targets_min": 2429
},
{
"epoch": 1.0385497934832493,
"grad_norm": 0.263662987853797,
"learning_rate": 3.86132946998236e-05,
"loss": 0.4401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13648268580436707,
"step": 755,
"valid_targets_mean": 7897.7,
"valid_targets_min": 2091
},
{
"epoch": 1.0454336851766866,
"grad_norm": 0.27437828717361396,
"learning_rate": 3.8577940368716076e-05,
"loss": 0.433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15187282860279083,
"step": 760,
"valid_targets_mean": 7362.4,
"valid_targets_min": 1674
},
{
"epoch": 1.0523175768701238,
"grad_norm": 0.27325212819692263,
"learning_rate": 3.8542157612026184e-05,
"loss": 0.4184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13746723532676697,
"step": 765,
"valid_targets_mean": 6896.6,
"valid_targets_min": 2522
},
{
"epoch": 1.0592014685635613,
"grad_norm": 0.23473196308314714,
"learning_rate": 3.850594725493949e-05,
"loss": 0.4161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1299147754907608,
"step": 770,
"valid_targets_mean": 7470.7,
"valid_targets_min": 2790
},
{
"epoch": 1.0660853602569986,
"grad_norm": 0.28555087309472654,
"learning_rate": 3.846931013250246e-05,
"loss": 0.4132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14030131697654724,
"step": 775,
"valid_targets_mean": 8266.8,
"valid_targets_min": 3307
},
{
"epoch": 1.072969251950436,
"grad_norm": 0.23621951887818643,
"learning_rate": 3.8432247089603167e-05,
"loss": 0.4042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11525264382362366,
"step": 780,
"valid_targets_mean": 8286.0,
"valid_targets_min": 325
},
{
"epoch": 1.0798531436438734,
"grad_norm": 0.21450593319657246,
"learning_rate": 3.8394758980951864e-05,
"loss": 0.3895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13908235728740692,
"step": 785,
"valid_targets_mean": 9267.8,
"valid_targets_min": 5215
},
{
"epoch": 1.0867370353373107,
"grad_norm": 0.23844000544208796,
"learning_rate": 3.83568466710612e-05,
"loss": 0.3801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12820349633693695,
"step": 790,
"valid_targets_mean": 9206.4,
"valid_targets_min": 3552
},
{
"epoch": 1.093620927030748,
"grad_norm": 0.2103809566833362,
"learning_rate": 3.8318511034226344e-05,
"loss": 0.372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13335391879081726,
"step": 795,
"valid_targets_mean": 9805.0,
"valid_targets_min": 435
},
{
"epoch": 1.1005048187241855,
"grad_norm": 0.23124182975495058,
"learning_rate": 3.8279752954504814e-05,
"loss": 0.3748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1326015442609787,
"step": 800,
"valid_targets_mean": 9971.8,
"valid_targets_min": 3896
},
{
"epoch": 1.1073887104176228,
"grad_norm": 0.23438818276332576,
"learning_rate": 3.824057332569604e-05,
"loss": 0.3691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12420172989368439,
"step": 805,
"valid_targets_mean": 9100.1,
"valid_targets_min": 3598
},
{
"epoch": 1.11427260211106,
"grad_norm": 0.24214472926654473,
"learning_rate": 3.820097305132081e-05,
"loss": 0.3668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12364979088306427,
"step": 810,
"valid_targets_mean": 9095.8,
"valid_targets_min": 3870
},
{
"epoch": 1.1211564938044976,
"grad_norm": 0.2218011971147791,
"learning_rate": 3.8160953044600426e-05,
"loss": 0.3703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11890929937362671,
"step": 815,
"valid_targets_mean": 8719.1,
"valid_targets_min": 3803
},
{
"epoch": 1.1280403854979348,
"grad_norm": 0.2563084709321499,
"learning_rate": 3.81205142284356e-05,
"loss": 0.3606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12726369500160217,
"step": 820,
"valid_targets_mean": 9952.8,
"valid_targets_min": 703
},
{
"epoch": 1.1349242771913721,
"grad_norm": 0.22881759734160312,
"learning_rate": 3.807965753538522e-05,
"loss": 0.3648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12239524722099304,
"step": 825,
"valid_targets_mean": 9790.2,
"valid_targets_min": 1990
},
{
"epoch": 1.1418081688848096,
"grad_norm": 0.20713165564079833,
"learning_rate": 3.8038383907644834e-05,
"loss": 0.363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11979646980762482,
"step": 830,
"valid_targets_mean": 9145.0,
"valid_targets_min": 3036
},
{
"epoch": 1.148692060578247,
"grad_norm": 0.22499311166594924,
"learning_rate": 3.7996694297024895e-05,
"loss": 0.3578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1096620187163353,
"step": 835,
"valid_targets_mean": 9393.3,
"valid_targets_min": 749
},
{
"epoch": 1.1555759522716842,
"grad_norm": 0.21590056824128998,
"learning_rate": 3.795458966492884e-05,
"loss": 0.3581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10937801003456116,
"step": 840,
"valid_targets_mean": 8753.6,
"valid_targets_min": 721
},
{
"epoch": 1.1624598439651217,
"grad_norm": 0.22742334578308168,
"learning_rate": 3.7912070982330906e-05,
"loss": 0.3575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1197114810347557,
"step": 845,
"valid_targets_mean": 9578.5,
"valid_targets_min": 2306
},
{
"epoch": 1.169343735658559,
"grad_norm": 0.2224738441211927,
"learning_rate": 3.786913922975375e-05,
"loss": 0.3634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11998347193002701,
"step": 850,
"valid_targets_mean": 9520.8,
"valid_targets_min": 4270
},
{
"epoch": 1.1762276273519963,
"grad_norm": 0.22538381825701656,
"learning_rate": 3.782579539724582e-05,
"loss": 0.3621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12625733017921448,
"step": 855,
"valid_targets_mean": 10044.1,
"valid_targets_min": 5057
},
{
"epoch": 1.1831115190454338,
"grad_norm": 0.21800136414016363,
"learning_rate": 3.7782040484358547e-05,
"loss": 0.3465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1133735179901123,
"step": 860,
"valid_targets_mean": 9430.1,
"valid_targets_min": 4478
},
{
"epoch": 1.189995410738871,
"grad_norm": 0.21734230529243184,
"learning_rate": 3.773787550012325e-05,
"loss": 0.3506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11655744165182114,
"step": 865,
"valid_targets_mean": 9906.8,
"valid_targets_min": 4602
},
{
"epoch": 1.1968793024323083,
"grad_norm": 0.2263363296427952,
"learning_rate": 3.7693301463027935e-05,
"loss": 0.3507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12009304761886597,
"step": 870,
"valid_targets_mean": 9816.9,
"valid_targets_min": 600
},
{
"epoch": 1.2037631941257458,
"grad_norm": 0.23210893100009392,
"learning_rate": 3.764831940099374e-05,
"loss": 0.3563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11706417053937912,
"step": 875,
"valid_targets_mean": 9615.7,
"valid_targets_min": 321
},
{
"epoch": 1.2106470858191831,
"grad_norm": 0.1985963493513162,
"learning_rate": 3.760293035135127e-05,
"loss": 0.3447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11027579009532928,
"step": 880,
"valid_targets_mean": 9669.4,
"valid_targets_min": 4373
},
{
"epoch": 1.2175309775126204,
"grad_norm": 0.2247655964238049,
"learning_rate": 3.755713536081667e-05,
"loss": 0.3545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12357079982757568,
"step": 885,
"valid_targets_mean": 10030.3,
"valid_targets_min": 4760
},
{
"epoch": 1.224414869206058,
"grad_norm": 0.2459045345695429,
"learning_rate": 3.751093548546748e-05,
"loss": 0.3461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11696697026491165,
"step": 890,
"valid_targets_mean": 9881.2,
"valid_targets_min": 4785
},
{
"epoch": 1.2312987608994952,
"grad_norm": 0.22797315282104857,
"learning_rate": 3.7464331790718265e-05,
"loss": 0.3492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11382002383470535,
"step": 895,
"valid_targets_mean": 9669.7,
"valid_targets_min": 3932
},
{
"epoch": 1.2381826525929325,
"grad_norm": 0.19552476356000423,
"learning_rate": 3.7417325351296086e-05,
"loss": 0.3434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11515460908412933,
"step": 900,
"valid_targets_mean": 9425.6,
"valid_targets_min": 3063
},
{
"epoch": 1.24506654428637,
"grad_norm": 0.21705318540183,
"learning_rate": 3.736991725121567e-05,
"loss": 0.3454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1254062056541443,
"step": 905,
"valid_targets_mean": 9942.2,
"valid_targets_min": 3468
},
{
"epoch": 1.2519504359798073,
"grad_norm": 0.21696447157131418,
"learning_rate": 3.732210858375447e-05,
"loss": 0.3399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11086012423038483,
"step": 910,
"valid_targets_mean": 9693.8,
"valid_targets_min": 562
},
{
"epoch": 1.2588343276732445,
"grad_norm": 0.2169988687602966,
"learning_rate": 3.727390045142737e-05,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12142230570316315,
"step": 915,
"valid_targets_mean": 10011.0,
"valid_targets_min": 3774
},
{
"epoch": 1.2657182193666818,
"grad_norm": 0.22548894074150583,
"learning_rate": 3.722529396596133e-05,
"loss": 0.3473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08062661439180374,
"step": 920,
"valid_targets_mean": 5209.4,
"valid_targets_min": 484
},
{
"epoch": 1.2726021110601193,
"grad_norm": 0.2845110154034618,
"learning_rate": 3.717629024826974e-05,
"loss": 0.3733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12345914542675018,
"step": 925,
"valid_targets_mean": 6386.3,
"valid_targets_min": 3796
},
{
"epoch": 1.2794860027535566,
"grad_norm": 0.2968424819324445,
"learning_rate": 3.712689042842654e-05,
"loss": 0.374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14066240191459656,
"step": 930,
"valid_targets_mean": 6407.3,
"valid_targets_min": 2561
},
{
"epoch": 1.286369894446994,
"grad_norm": 0.6809334906683846,
"learning_rate": 3.707709564564017e-05,
"loss": 0.785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22839263081550598,
"step": 935,
"valid_targets_mean": 4497.1,
"valid_targets_min": 1348
},
{
"epoch": 1.2932537861404314,
"grad_norm": 0.44144670158983224,
"learning_rate": 3.70269070482273e-05,
"loss": 0.6665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18578793108463287,
"step": 940,
"valid_targets_mean": 4428.4,
"valid_targets_min": 1031
},
{
"epoch": 1.3001376778338687,
"grad_norm": 0.41426028869608567,
"learning_rate": 3.697632579358638e-05,
"loss": 0.6768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24046120047569275,
"step": 945,
"valid_targets_mean": 3730.1,
"valid_targets_min": 827
},
{
"epoch": 1.307021569527306,
"grad_norm": 0.29429169560205576,
"learning_rate": 3.69253530481709e-05,
"loss": 0.629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2377484142780304,
"step": 950,
"valid_targets_mean": 4497.8,
"valid_targets_min": 1422
},
{
"epoch": 1.3139054612207435,
"grad_norm": 0.32861368080088155,
"learning_rate": 3.687398998746252e-05,
"loss": 0.6108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17878547310829163,
"step": 955,
"valid_targets_mean": 2116.2,
"valid_targets_min": 785
},
{
"epoch": 1.3207893529141808,
"grad_norm": 0.26314724951089413,
"learning_rate": 3.6822237795943954e-05,
"loss": 0.606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1861293911933899,
"step": 960,
"valid_targets_mean": 4756.1,
"valid_targets_min": 1301
},
{
"epoch": 1.327673244607618,
"grad_norm": 0.2615679937645198,
"learning_rate": 3.6770097667071644e-05,
"loss": 0.596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18951809406280518,
"step": 965,
"valid_targets_mean": 4760.8,
"valid_targets_min": 758
},
{
"epoch": 1.3345571363010555,
"grad_norm": 0.26095009111284634,
"learning_rate": 3.671757080324826e-05,
"loss": 0.6175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2091958373785019,
"step": 970,
"valid_targets_mean": 3936.6,
"valid_targets_min": 1412
},
{
"epoch": 1.3414410279944928,
"grad_norm": 0.2776471727246407,
"learning_rate": 3.666465841579497e-05,
"loss": 0.5951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21168652176856995,
"step": 975,
"valid_targets_mean": 4049.9,
"valid_targets_min": 928
},
{
"epoch": 1.3483249196879301,
"grad_norm": 0.33267792860891676,
"learning_rate": 3.661136172492347e-05,
"loss": 0.5772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22148503363132477,
"step": 980,
"valid_targets_mean": 3266.9,
"valid_targets_min": 782
},
{
"epoch": 1.3552088113813676,
"grad_norm": 0.25102430709893414,
"learning_rate": 3.6557681959707905e-05,
"loss": 0.5882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19643747806549072,
"step": 985,
"valid_targets_mean": 4822.6,
"valid_targets_min": 1093
},
{
"epoch": 1.362092703074805,
"grad_norm": 0.26862571049180023,
"learning_rate": 3.6503620358056455e-05,
"loss": 0.5854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17380109429359436,
"step": 990,
"valid_targets_mean": 3932.0,
"valid_targets_min": 1179
},
{
"epoch": 1.3689765947682422,
"grad_norm": 0.287984411639415,
"learning_rate": 3.6449178166682846e-05,
"loss": 0.571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19724878668785095,
"step": 995,
"valid_targets_mean": 3117.2,
"valid_targets_min": 1152
},
{
"epoch": 1.3758604864616797,
"grad_norm": 0.2796683062977205,
"learning_rate": 3.639435664107758e-05,
"loss": 0.598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16841533780097961,
"step": 1000,
"valid_targets_mean": 3402.1,
"valid_targets_min": 1357
},
{
"epoch": 1.382744378155117,
"grad_norm": 0.4239174740835374,
"learning_rate": 3.633915704547897e-05,
"loss": 0.594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2718241810798645,
"step": 1005,
"valid_targets_mean": 3427.9,
"valid_targets_min": 1115
},
{
"epoch": 1.3896282698485543,
"grad_norm": 0.2647039858767095,
"learning_rate": 3.628358065284399e-05,
"loss": 0.5874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17966550588607788,
"step": 1010,
"valid_targets_mean": 4640.0,
"valid_targets_min": 1563
},
{
"epoch": 1.3965121615419918,
"grad_norm": 0.2678172631650953,
"learning_rate": 3.6227628744818935e-05,
"loss": 0.5892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18576546013355255,
"step": 1015,
"valid_targets_mean": 3996.0,
"valid_targets_min": 1296
},
{
"epoch": 1.403396053235429,
"grad_norm": 0.317908066233358,
"learning_rate": 3.617130261170985e-05,
"loss": 0.5805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17968283593654633,
"step": 1020,
"valid_targets_mean": 3636.5,
"valid_targets_min": 1273
},
{
"epoch": 1.4102799449288663,
"grad_norm": 0.28706768200325383,
"learning_rate": 3.611460355245279e-05,
"loss": 0.6015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19896183907985687,
"step": 1025,
"valid_targets_mean": 3391.8,
"valid_targets_min": 1536
},
{
"epoch": 1.4171638366223038,
"grad_norm": 0.4445920863658933,
"learning_rate": 3.6057532874583825e-05,
"loss": 0.5255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1340232938528061,
"step": 1030,
"valid_targets_mean": 5537.1,
"valid_targets_min": 2564
},
{
"epoch": 1.4240477283157411,
"grad_norm": 0.28330961789345677,
"learning_rate": 3.600009189420895e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06687448918819427,
"step": 1035,
"valid_targets_mean": 5478.3,
"valid_targets_min": 2226
},
{
"epoch": 1.4309316200091784,
"grad_norm": 0.22020183707384766,
"learning_rate": 3.594228193597369e-05,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052432358264923096,
"step": 1040,
"valid_targets_mean": 4935.5,
"valid_targets_min": 2518
},
{
"epoch": 1.437815511702616,
"grad_norm": 0.25073378136582336,
"learning_rate": 3.588410433303253e-05,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06154193356633186,
"step": 1045,
"valid_targets_mean": 5529.9,
"valid_targets_min": 3140
},
{
"epoch": 1.4446994033960532,
"grad_norm": 0.20180073452824873,
"learning_rate": 3.582556042701825e-05,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05435199290513992,
"step": 1050,
"valid_targets_mean": 4935.2,
"valid_targets_min": 2984
},
{
"epoch": 1.4515832950894905,
"grad_norm": 0.23113035959905193,
"learning_rate": 3.5766651568010926e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05378912016749382,
"step": 1055,
"valid_targets_mean": 4934.8,
"valid_targets_min": 2648
},
{
"epoch": 1.458467186782928,
"grad_norm": 0.24237558785107005,
"learning_rate": 3.5707379114506785e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05625016614794731,
"step": 1060,
"valid_targets_mean": 5136.8,
"valid_targets_min": 2159
},
{
"epoch": 1.4653510784763653,
"grad_norm": 0.2162706048508137,
"learning_rate": 3.564774443338692e-05,
"loss": 0.1729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05345233902335167,
"step": 1065,
"valid_targets_mean": 5029.4,
"valid_targets_min": 2963
},
{
"epoch": 1.4722349701698025,
"grad_norm": 0.22973501526812276,
"learning_rate": 3.558774889988577e-05,
"loss": 0.1731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05721583217382431,
"step": 1070,
"valid_targets_mean": 5930.7,
"valid_targets_min": 2714
},
{
"epoch": 1.47911886186324,
"grad_norm": 0.20364094812823397,
"learning_rate": 3.552739389755934e-05,
"loss": 0.1673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052951518446207047,
"step": 1075,
"valid_targets_mean": 5439.3,
"valid_targets_min": 2668
},
{
"epoch": 1.4860027535566773,
"grad_norm": 0.1986389709515152,
"learning_rate": 3.546668081825337e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052483733743429184,
"step": 1080,
"valid_targets_mean": 5153.3,
"valid_targets_min": 2730
},
{
"epoch": 1.4928866452501146,
"grad_norm": 0.24482610765610374,
"learning_rate": 3.54056110620712e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06315732002258301,
"step": 1085,
"valid_targets_mean": 5870.0,
"valid_targets_min": 3065
},
{
"epoch": 1.4997705369435521,
"grad_norm": 0.20159556415367041,
"learning_rate": 3.534418603734149e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058553457260131836,
"step": 1090,
"valid_targets_mean": 5658.6,
"valid_targets_min": 2803
},
{
"epoch": 1.5066544286369894,
"grad_norm": 0.19181232874888832,
"learning_rate": 3.5282407160585736e-05,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052791528403759,
"step": 1095,
"valid_targets_mean": 5224.7,
"valid_targets_min": 2628
},
{
"epoch": 1.5135383203304267,
"grad_norm": 0.1976739120005175,
"learning_rate": 3.522027585648562e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0571698397397995,
"step": 1100,
"valid_targets_mean": 5735.1,
"valid_targets_min": 3533
},
{
"epoch": 1.5204222120238642,
"grad_norm": 0.21306112608703381,
"learning_rate": 3.515779355785015e-05,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052656762301921844,
"step": 1105,
"valid_targets_mean": 5265.8,
"valid_targets_min": 2050
},
{
"epoch": 1.5273061037173015,
"grad_norm": 0.22603016387768135,
"learning_rate": 3.50949617055826e-05,
"loss": 0.167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06061364710330963,
"step": 1110,
"valid_targets_mean": 5609.0,
"valid_targets_min": 3609
},
{
"epoch": 1.5341899954107387,
"grad_norm": 0.1980792666536461,
"learning_rate": 3.5031781748647286e-05,
"loss": 0.166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05426044017076492,
"step": 1115,
"valid_targets_mean": 5324.1,
"valid_targets_min": 1713
},
{
"epoch": 1.5410738871041763,
"grad_norm": 0.23644084395489454,
"learning_rate": 3.496825514403618e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05629802495241165,
"step": 1120,
"valid_targets_mean": 4990.3,
"valid_targets_min": 665
},
{
"epoch": 1.5479577787976135,
"grad_norm": 0.22755681790453738,
"learning_rate": 3.490438335673529e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05739838257431984,
"step": 1125,
"valid_targets_mean": 5599.9,
"valid_targets_min": 2657
},
{
"epoch": 1.5548416704910508,
"grad_norm": 0.19425963994466555,
"learning_rate": 3.484016785969087e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.055991411209106445,
"step": 1130,
"valid_targets_mean": 5342.1,
"valid_targets_min": 2880
},
{
"epoch": 1.5617255621844883,
"grad_norm": 0.5078671708098624,
"learning_rate": 3.4775610133775444e-05,
"loss": 0.3155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19734632968902588,
"step": 1135,
"valid_targets_mean": 3803.8,
"valid_targets_min": 1361
},
{
"epoch": 1.5686094538779256,
"grad_norm": 0.34030876024881695,
"learning_rate": 3.47107116677537e-05,
"loss": 0.5021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1680268496274948,
"step": 1140,
"valid_targets_mean": 4280.1,
"valid_targets_min": 341
},
{
"epoch": 1.575493345571363,
"grad_norm": 0.3386827436095329,
"learning_rate": 3.464547395824811e-05,
"loss": 0.4634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1324179768562317,
"step": 1145,
"valid_targets_mean": 4561.8,
"valid_targets_min": 1051
},
{
"epoch": 1.5823772372648004,
"grad_norm": 0.2926014105305259,
"learning_rate": 3.457989850970444e-05,
"loss": 0.513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17301608622074127,
"step": 1150,
"valid_targets_mean": 3689.7,
"valid_targets_min": 1235
},
{
"epoch": 1.5892611289582377,
"grad_norm": 0.27196678108600447,
"learning_rate": 3.451398683435704e-05,
"loss": 0.4809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14032022655010223,
"step": 1155,
"valid_targets_mean": 3426.4,
"valid_targets_min": 974
},
{
"epoch": 1.596145020651675,
"grad_norm": 0.3130005942988459,
"learning_rate": 3.4447740452193995e-05,
"loss": 0.4868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20944523811340332,
"step": 1160,
"valid_targets_mean": 3986.3,
"valid_targets_min": 1079
},
{
"epoch": 1.6030289123451125,
"grad_norm": 0.2717471489428658,
"learning_rate": 3.438116089092205e-05,
"loss": 0.4682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.139183908700943,
"step": 1165,
"valid_targets_mean": 3593.2,
"valid_targets_min": 926
},
{
"epoch": 1.6099128040385497,
"grad_norm": 0.27909638857698826,
"learning_rate": 3.43142496859314e-05,
"loss": 0.4608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13917654752731323,
"step": 1170,
"valid_targets_mean": 3480.5,
"valid_targets_min": 1151
},
{
"epoch": 1.616796695731987,
"grad_norm": 0.26768993562882953,
"learning_rate": 3.4247008380260244e-05,
"loss": 0.488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17577114701271057,
"step": 1175,
"valid_targets_mean": 3933.4,
"valid_targets_min": 1036
},
{
"epoch": 1.6236805874254245,
"grad_norm": 0.2932889829762393,
"learning_rate": 3.4179438524559255e-05,
"loss": 0.4728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15570342540740967,
"step": 1180,
"valid_targets_mean": 3254.5,
"valid_targets_min": 1190
},
{
"epoch": 1.6305644791188618,
"grad_norm": 0.24071768152710976,
"learning_rate": 3.411154167705578e-05,
"loss": 0.4511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1142294779419899,
"step": 1185,
"valid_targets_mean": 3184.5,
"valid_targets_min": 627
},
{
"epoch": 1.637448370812299,
"grad_norm": 0.2752558490458923,
"learning_rate": 3.404331940351793e-05,
"loss": 0.4907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14964590966701508,
"step": 1190,
"valid_targets_mean": 4686.7,
"valid_targets_min": 1218
},
{
"epoch": 1.6443322625057366,
"grad_norm": 0.2949052887253943,
"learning_rate": 3.397477327721844e-05,
"loss": 0.4596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17306478321552277,
"step": 1195,
"valid_targets_mean": 4532.6,
"valid_targets_min": 613
},
{
"epoch": 1.651216154199174,
"grad_norm": 0.28952244979890357,
"learning_rate": 3.390590487889842e-05,
"loss": 0.4909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15265388786792755,
"step": 1200,
"valid_targets_mean": 3717.2,
"valid_targets_min": 1137
},
{
"epoch": 1.6581000458926112,
"grad_norm": 0.3121644616582937,
"learning_rate": 3.38367157967309e-05,
"loss": 0.47,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1337219774723053,
"step": 1205,
"valid_targets_mean": 3432.2,
"valid_targets_min": 766
},
{
"epoch": 1.6649839375860487,
"grad_norm": 0.25739831721805007,
"learning_rate": 3.3767207626284184e-05,
"loss": 0.4744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17433468997478485,
"step": 1210,
"valid_targets_mean": 4030.4,
"valid_targets_min": 1035
},
{
"epoch": 1.671867829279486,
"grad_norm": 0.2998480779773187,
"learning_rate": 3.369738197048505e-05,
"loss": 0.4813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13764141499996185,
"step": 1215,
"valid_targets_mean": 3379.8,
"valid_targets_min": 1265
},
{
"epoch": 1.6787517209729232,
"grad_norm": 0.3600517795584768,
"learning_rate": 3.362724043958184e-05,
"loss": 0.4755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14118696749210358,
"step": 1220,
"valid_targets_mean": 2594.7,
"valid_targets_min": 1135
},
{
"epoch": 1.6856356126663607,
"grad_norm": 0.3194827365553974,
"learning_rate": 3.355678465110725e-05,
"loss": 0.4506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08822810649871826,
"step": 1225,
"valid_targets_mean": 972.6,
"valid_targets_min": 546
},
{
"epoch": 1.692519504359798,
"grad_norm": 0.2769855539856663,
"learning_rate": 3.348601622984107e-05,
"loss": 0.4816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1904619336128235,
"step": 1230,
"valid_targets_mean": 5099.9,
"valid_targets_min": 1465
},
{
"epoch": 1.6994033960532353,
"grad_norm": 0.2923413221945997,
"learning_rate": 3.3414936807772736e-05,
"loss": 0.4764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18333196640014648,
"step": 1235,
"valid_targets_mean": 5051.9,
"valid_targets_min": 986
},
{
"epoch": 1.7062872877466728,
"grad_norm": 0.39463221323145375,
"learning_rate": 3.334354802406364e-05,
"loss": 0.4142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11668369174003601,
"step": 1240,
"valid_targets_mean": 6354.4,
"valid_targets_min": 348
},
{
"epoch": 1.71317117944011,
"grad_norm": 0.29121380337364977,
"learning_rate": 3.327185152500937e-05,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09022815525531769,
"step": 1245,
"valid_targets_mean": 6446.1,
"valid_targets_min": 139
},
{
"epoch": 1.7200550711335474,
"grad_norm": 0.2108193199124782,
"learning_rate": 3.3199848964001744e-05,
"loss": 0.2803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0786634087562561,
"step": 1250,
"valid_targets_mean": 3949.5,
"valid_targets_min": 306
},
{
"epoch": 1.726938962826985,
"grad_norm": 0.2164063397768852,
"learning_rate": 3.312754200149065e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10437431931495667,
"step": 1255,
"valid_targets_mean": 6445.5,
"valid_targets_min": 501
},
{
"epoch": 1.7338228545204222,
"grad_norm": 0.20918460158950558,
"learning_rate": 3.305493230494576e-05,
"loss": 0.2856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09302932769060135,
"step": 1260,
"valid_targets_mean": 6484.1,
"valid_targets_min": 702
},
{
"epoch": 1.7407067462138595,
"grad_norm": 0.20429734603153177,
"learning_rate": 3.298202154881814e-05,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09457381814718246,
"step": 1265,
"valid_targets_mean": 7440.5,
"valid_targets_min": 914
},
{
"epoch": 1.747590637907297,
"grad_norm": 0.18234677362943436,
"learning_rate": 3.2908811414501545e-05,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10430276393890381,
"step": 1270,
"valid_targets_mean": 7078.0,
"valid_targets_min": 280
},
{
"epoch": 1.7544745296007342,
"grad_norm": 0.24974357174847586,
"learning_rate": 3.283530359029369e-05,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09898485243320465,
"step": 1275,
"valid_targets_mean": 6463.1,
"valid_targets_min": 1221
},
{
"epoch": 1.7613584212941715,
"grad_norm": 0.19176634782115026,
"learning_rate": 3.276149977135735e-05,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07478626072406769,
"step": 1280,
"valid_targets_mean": 6061.8,
"valid_targets_min": 1412
},
{
"epoch": 1.768242312987609,
"grad_norm": 0.1999902463647874,
"learning_rate": 3.268740165968116e-05,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11764705926179886,
"step": 1285,
"valid_targets_mean": 6472.4,
"valid_targets_min": 277
},
{
"epoch": 1.7751262046810463,
"grad_norm": 0.1789066747451937,
"learning_rate": 3.261301096404051e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07152275741100311,
"step": 1290,
"valid_targets_mean": 7596.1,
"valid_targets_min": 2298
},
{
"epoch": 1.7820100963744836,
"grad_norm": 0.1824655024569692,
"learning_rate": 3.2538329399958006e-05,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08981531858444214,
"step": 1295,
"valid_targets_mean": 7278.7,
"valid_targets_min": 299
},
{
"epoch": 1.788893988067921,
"grad_norm": 0.23888882746848344,
"learning_rate": 3.2463358689664e-05,
"loss": 0.3069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10454994440078735,
"step": 1300,
"valid_targets_mean": 6472.9,
"valid_targets_min": 578
},
{
"epoch": 1.7957778797613584,
"grad_norm": 0.18924585287250698,
"learning_rate": 3.238810056205682e-05,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09392829984426498,
"step": 1305,
"valid_targets_mean": 6411.4,
"valid_targets_min": 176
},
{
"epoch": 1.8026617714547957,
"grad_norm": 0.1958691238588584,
"learning_rate": 3.2312556752662946e-05,
"loss": 0.2753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10470084100961685,
"step": 1310,
"valid_targets_mean": 5064.2,
"valid_targets_min": 746
},
{
"epoch": 1.8095456631482332,
"grad_norm": 0.2170787439967381,
"learning_rate": 3.223672900359693e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11556200683116913,
"step": 1315,
"valid_targets_mean": 6593.2,
"valid_targets_min": 1045
},
{
"epoch": 1.8164295548416705,
"grad_norm": 0.1867201765991889,
"learning_rate": 3.2160619063521274e-05,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07859818637371063,
"step": 1320,
"valid_targets_mean": 5822.4,
"valid_targets_min": 952
},
{
"epoch": 1.8233134465351077,
"grad_norm": 0.18138072725490167,
"learning_rate": 3.2084228687606076e-05,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12460223585367203,
"step": 1325,
"valid_targets_mean": 8131.2,
"valid_targets_min": 270
},
{
"epoch": 1.8301973382285452,
"grad_norm": 0.19754129821945798,
"learning_rate": 3.200755963748856e-05,
"loss": 0.2693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0860404372215271,
"step": 1330,
"valid_targets_mean": 6484.8,
"valid_targets_min": 1247
},
{
"epoch": 1.8370812299219825,
"grad_norm": 0.4698750684367156,
"learning_rate": 3.193061368123244e-05,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11438726633787155,
"step": 1335,
"valid_targets_mean": 3920.8,
"valid_targets_min": 2348
},
{
"epoch": 1.8439651216154198,
"grad_norm": 0.2603830415640527,
"learning_rate": 3.185339259328718e-05,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08097126334905624,
"step": 1340,
"valid_targets_mean": 4168.3,
"valid_targets_min": 1174
},
{
"epoch": 1.8508490133088573,
"grad_norm": 0.26754326662182265,
"learning_rate": 3.1775898154447035e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07933999598026276,
"step": 1345,
"valid_targets_mean": 3803.8,
"valid_targets_min": 1855
},
{
"epoch": 1.8577329050022946,
"grad_norm": 0.2627395021404963,
"learning_rate": 3.169813215181e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0736798420548439,
"step": 1350,
"valid_targets_mean": 4049.7,
"valid_targets_min": 2535
},
{
"epoch": 1.8646167966957319,
"grad_norm": 0.26403469391586964,
"learning_rate": 3.162009637873662e-05,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07726424932479858,
"step": 1355,
"valid_targets_mean": 3835.0,
"valid_targets_min": 423
},
{
"epoch": 1.8715006883891694,
"grad_norm": 0.2252698294361399,
"learning_rate": 3.1541792634808586e-05,
"loss": 0.2237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07776709645986557,
"step": 1360,
"valid_targets_mean": 3791.8,
"valid_targets_min": 1366
},
{
"epoch": 1.8783845800826067,
"grad_norm": 0.21611929490789147,
"learning_rate": 3.146322272578726e-05,
"loss": 0.2209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07243067771196365,
"step": 1365,
"valid_targets_mean": 3614.4,
"valid_targets_min": 452
},
{
"epoch": 1.885268471776044,
"grad_norm": 0.23385487665271673,
"learning_rate": 3.138438846357208e-05,
"loss": 0.2223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06762323528528214,
"step": 1370,
"valid_targets_mean": 3766.9,
"valid_targets_min": 505
},
{
"epoch": 1.8921523634694815,
"grad_norm": 0.26904239709962535,
"learning_rate": 3.1305291666158645e-05,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06977090984582901,
"step": 1375,
"valid_targets_mean": 3492.3,
"valid_targets_min": 289
},
{
"epoch": 1.8990362551629187,
"grad_norm": 0.25067490435632334,
"learning_rate": 3.1225934157596946e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07045575231313705,
"step": 1380,
"valid_targets_mean": 3381.6,
"valid_targets_min": 460
},
{
"epoch": 1.905920146856356,
"grad_norm": 0.2627943908553539,
"learning_rate": 3.1146317767949205e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07210519909858704,
"step": 1385,
"valid_targets_mean": 3726.1,
"valid_targets_min": 441
},
{
"epoch": 1.9128040385497935,
"grad_norm": 0.24210474794590595,
"learning_rate": 3.106644433324768e-05,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05783864110708237,
"step": 1390,
"valid_targets_mean": 3206.2,
"valid_targets_min": 488
},
{
"epoch": 1.9196879302432308,
"grad_norm": 0.2788195303094242,
"learning_rate": 3.098631569545238e-05,
"loss": 0.2167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06336452066898346,
"step": 1395,
"valid_targets_mean": 3425.1,
"valid_targets_min": 454
},
{
"epoch": 1.926571821936668,
"grad_norm": 0.22849195239295697,
"learning_rate": 3.090593370240852e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07397540658712387,
"step": 1400,
"valid_targets_mean": 4109.9,
"valid_targets_min": 462
},
{
"epoch": 1.9334557136301056,
"grad_norm": 0.2409752826569829,
"learning_rate": 3.082530020780392e-05,
"loss": 0.2169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06807292997837067,
"step": 1405,
"valid_targets_mean": 3850.9,
"valid_targets_min": 919
},
{
"epoch": 1.9403396053235429,
"grad_norm": 0.45451934745934763,
"learning_rate": 3.074441707112632e-05,
"loss": 0.2511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09514793753623962,
"step": 1410,
"valid_targets_mean": 6487.8,
"valid_targets_min": 453
},
{
"epoch": 1.9472234970169802,
"grad_norm": 0.31985575958658746,
"learning_rate": 3.0663286157620414e-05,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0950220376253128,
"step": 1415,
"valid_targets_mean": 7570.3,
"valid_targets_min": 1928
},
{
"epoch": 1.9541073887104177,
"grad_norm": 0.28719145252156947,
"learning_rate": 3.058190933824489e-05,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08216243982315063,
"step": 1420,
"valid_targets_mean": 6536.0,
"valid_targets_min": 386
},
{
"epoch": 1.960991280403855,
"grad_norm": 0.23128236961277554,
"learning_rate": 3.0500288489629263e-05,
"loss": 0.2617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08936893939971924,
"step": 1425,
"valid_targets_mean": 7177.7,
"valid_targets_min": 446
},
{
"epoch": 1.9678751720972922,
"grad_norm": 0.24609523942492573,
"learning_rate": 3.0418425494030596e-05,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07563286274671555,
"step": 1430,
"valid_targets_mean": 6110.9,
"valid_targets_min": 321
},
{
"epoch": 1.9747590637907297,
"grad_norm": 0.24658402476334376,
"learning_rate": 3.0336322239290118e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08098824322223663,
"step": 1435,
"valid_targets_mean": 6657.7,
"valid_targets_min": 3389
},
{
"epoch": 1.981642955484167,
"grad_norm": 0.22318614135355666,
"learning_rate": 3.0253980618789654e-05,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07510203123092651,
"step": 1440,
"valid_targets_mean": 6613.5,
"valid_targets_min": 524
},
{
"epoch": 1.9885268471776043,
"grad_norm": 0.21078425849583504,
"learning_rate": 3.0171402531407982e-05,
"loss": 0.2431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0857941061258316,
"step": 1445,
"valid_targets_mean": 7165.2,
"valid_targets_min": 2065
},
{
"epoch": 1.9954107388710418,
"grad_norm": 0.22410382081565297,
"learning_rate": 3.008858988147704e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08800241351127625,
"step": 1450,
"valid_targets_mean": 6591.6,
"valid_targets_min": 155
},
{
"epoch": 2.0013767783386873,
"grad_norm": 2.6466904749858258,
"learning_rate": 3.0005544578738005e-05,
"loss": 0.3707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23792487382888794,
"step": 1455,
"valid_targets_mean": 7264.4,
"valid_targets_min": 1973
},
{
"epoch": 2.008260670032125,
"grad_norm": 0.9648943337750195,
"learning_rate": 2.9922268538297267e-05,
"loss": 0.5503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20204994082450867,
"step": 1460,
"valid_targets_mean": 9100.2,
"valid_targets_min": 3178
},
{
"epoch": 2.0151445617255623,
"grad_norm": 0.8297593468986739,
"learning_rate": 2.9838763680582247e-05,
"loss": 0.4629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14032147824764252,
"step": 1465,
"valid_targets_mean": 6959.6,
"valid_targets_min": 2166
},
{
"epoch": 2.0220284534189994,
"grad_norm": 0.3948957029510476,
"learning_rate": 2.9755031931297113e-05,
"loss": 0.4265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1425497829914093,
"step": 1470,
"valid_targets_mean": 7188.0,
"valid_targets_min": 2166
},
{
"epoch": 2.028912345112437,
"grad_norm": 0.2843596306589016,
"learning_rate": 2.9671075221378386e-05,
"loss": 0.3967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14745484292507172,
"step": 1475,
"valid_targets_mean": 6959.9,
"valid_targets_min": 2083
},
{
"epoch": 2.0357962368058744,
"grad_norm": 0.7483106688731904,
"learning_rate": 2.9586895486950387e-05,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14458361268043518,
"step": 1480,
"valid_targets_mean": 7818.4,
"valid_targets_min": 2042
},
{
"epoch": 2.0426801284993115,
"grad_norm": 0.24953497116367615,
"learning_rate": 2.950249466928062e-05,
"loss": 0.3858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1309637874364853,
"step": 1485,
"valid_targets_mean": 7926.4,
"valid_targets_min": 3527
},
{
"epoch": 2.049564020192749,
"grad_norm": 0.23725116507324068,
"learning_rate": 2.9417874714734977e-05,
"loss": 0.3794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11365851759910583,
"step": 1490,
"valid_targets_mean": 6605.4,
"valid_targets_min": 2848
},
{
"epoch": 2.0564479118861865,
"grad_norm": 0.3158203272689995,
"learning_rate": 2.9333037574732847e-05,
"loss": 0.3706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1223248615860939,
"step": 1495,
"valid_targets_mean": 6947.1,
"valid_targets_min": 2244
},
{
"epoch": 2.0633318035796235,
"grad_norm": 0.25112193214684,
"learning_rate": 2.9247985205702166e-05,
"loss": 0.3735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12720884382724762,
"step": 1500,
"valid_targets_mean": 7027.9,
"valid_targets_min": 340
},
{
"epoch": 2.070215695273061,
"grad_norm": 0.24375670298938254,
"learning_rate": 2.9162719569034216e-05,
"loss": 0.369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14586299657821655,
"step": 1505,
"valid_targets_mean": 8959.9,
"valid_targets_min": 3446
},
{
"epoch": 2.0770995869664985,
"grad_norm": 0.21230058397434262,
"learning_rate": 2.9077242631038487e-05,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11099869012832642,
"step": 1510,
"valid_targets_mean": 9482.4,
"valid_targets_min": 5095
},
{
"epoch": 2.0839834786599356,
"grad_norm": 0.20509730804130927,
"learning_rate": 2.8991556362897248e-05,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10739248991012573,
"step": 1515,
"valid_targets_mean": 8913.7,
"valid_targets_min": 251
},
{
"epoch": 2.090867370353373,
"grad_norm": 0.22226379394756782,
"learning_rate": 2.890566274062015e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11422709375619888,
"step": 1520,
"valid_targets_mean": 8780.3,
"valid_targets_min": 349
},
{
"epoch": 2.0977512620468106,
"grad_norm": 0.20071008297351936,
"learning_rate": 2.8819563744998626e-05,
"loss": 0.3326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1113002598285675,
"step": 1525,
"valid_targets_mean": 9303.8,
"valid_targets_min": 773
},
{
"epoch": 2.1046351537402477,
"grad_norm": 0.20192807188862597,
"learning_rate": 2.8733261361560223e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10916690528392792,
"step": 1530,
"valid_targets_mean": 9819.0,
"valid_targets_min": 5584
},
{
"epoch": 2.111519045433685,
"grad_norm": 0.19824569692117233,
"learning_rate": 2.864675758052281e-05,
"loss": 0.3285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11355476081371307,
"step": 1535,
"valid_targets_mean": 9100.7,
"valid_targets_min": 306
},
{
"epoch": 2.1184029371271227,
"grad_norm": 0.24406167259488418,
"learning_rate": 2.8560054396748673e-05,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11132253706455231,
"step": 1540,
"valid_targets_mean": 9212.3,
"valid_targets_min": 378
},
{
"epoch": 2.1252868288205597,
"grad_norm": 0.20727883416494522,
"learning_rate": 2.8473153809698546e-05,
"loss": 0.3277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.098292276263237,
"step": 1545,
"valid_targets_mean": 8648.9,
"valid_targets_min": 1557
},
{
"epoch": 2.1321707205139973,
"grad_norm": 0.26662728617842596,
"learning_rate": 2.8386057823385446e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12168661504983902,
"step": 1550,
"valid_targets_mean": 10183.4,
"valid_targets_min": 3886
},
{
"epoch": 2.1390546122074348,
"grad_norm": 0.2278362271965239,
"learning_rate": 2.829876844632852e-05,
"loss": 0.3261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10494972765445709,
"step": 1555,
"valid_targets_mean": 9594.6,
"valid_targets_min": 344
},
{
"epoch": 2.145938503900872,
"grad_norm": 0.21689494772378176,
"learning_rate": 2.821128769150667e-05,
"loss": 0.3273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1015724167227745,
"step": 1560,
"valid_targets_mean": 8928.9,
"valid_targets_min": 897
},
{
"epoch": 2.1528223955943093,
"grad_norm": 0.21647054727360174,
"learning_rate": 2.8123617576312167e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11096221953630447,
"step": 1565,
"valid_targets_mean": 9772.7,
"valid_targets_min": 3574
},
{
"epoch": 2.159706287287747,
"grad_norm": 0.22433319070414948,
"learning_rate": 2.8035760122504126e-05,
"loss": 0.3258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1108248233795166,
"step": 1570,
"valid_targets_mean": 10406.6,
"valid_targets_min": 5877
},
{
"epoch": 2.166590178981184,
"grad_norm": 0.20015161510933208,
"learning_rate": 2.7947717356161867e-05,
"loss": 0.3265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11052754521369934,
"step": 1575,
"valid_targets_mean": 9535.4,
"valid_targets_min": 3557
},
{
"epoch": 2.1734740706746214,
"grad_norm": 0.2158786430865961,
"learning_rate": 2.78594913076382e-05,
"loss": 0.3337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10300415754318237,
"step": 1580,
"valid_targets_mean": 9136.9,
"valid_targets_min": 1343
},
{
"epoch": 2.180357962368059,
"grad_norm": 0.18903953041106164,
"learning_rate": 2.7771084011512603e-05,
"loss": 0.3227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09355498105287552,
"step": 1585,
"valid_targets_mean": 9388.7,
"valid_targets_min": 3282
},
{
"epoch": 2.187241854061496,
"grad_norm": 0.2308426422061156,
"learning_rate": 2.76824975065443e-05,
"loss": 0.3184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10470138490200043,
"step": 1590,
"valid_targets_mean": 9729.2,
"valid_targets_min": 3231
},
{
"epoch": 2.1941257457549335,
"grad_norm": 0.21713575495158471,
"learning_rate": 2.7593733835625246e-05,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12001024186611176,
"step": 1595,
"valid_targets_mean": 10332.3,
"valid_targets_min": 4344
},
{
"epoch": 2.201009637448371,
"grad_norm": 0.18564762498854304,
"learning_rate": 2.750479504573303e-05,
"loss": 0.3241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11725566536188126,
"step": 1600,
"valid_targets_mean": 11408.0,
"valid_targets_min": 5726
},
{
"epoch": 2.207893529141808,
"grad_norm": 0.20551407108267855,
"learning_rate": 2.7415683187883647e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11440514028072357,
"step": 1605,
"valid_targets_mean": 10250.5,
"valid_targets_min": 2607
},
{
"epoch": 2.2147774208352455,
"grad_norm": 0.19505075166019809,
"learning_rate": 2.7326400317084202e-05,
"loss": 0.3232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10536989569664001,
"step": 1610,
"valid_targets_mean": 9131.8,
"valid_targets_min": 761
},
{
"epoch": 2.221661312528683,
"grad_norm": 0.19443056596986627,
"learning_rate": 2.7236948492285535e-05,
"loss": 0.3214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11025330424308777,
"step": 1615,
"valid_targets_mean": 10329.2,
"valid_targets_min": 5291
},
{
"epoch": 2.22854520422212,
"grad_norm": 0.2110434913158342,
"learning_rate": 2.7147329776334742e-05,
"loss": 0.3232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1029968410730362,
"step": 1620,
"valid_targets_mean": 8999.2,
"valid_targets_min": 2381
},
{
"epoch": 2.2354290959155576,
"grad_norm": 0.1987583998355825,
"learning_rate": 2.7057546235927565e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11397416889667511,
"step": 1625,
"valid_targets_mean": 9227.1,
"valid_targets_min": 437
},
{
"epoch": 2.242312987608995,
"grad_norm": 0.20249691334408507,
"learning_rate": 2.696759994156079e-05,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10142004489898682,
"step": 1630,
"valid_targets_mean": 9084.0,
"valid_targets_min": 1451
},
{
"epoch": 2.249196879302432,
"grad_norm": 0.19109001564744665,
"learning_rate": 2.6877492967484447e-05,
"loss": 0.3158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09147472679615021,
"step": 1635,
"valid_targets_mean": 9274.7,
"valid_targets_min": 4259
},
{
"epoch": 2.2560807709958697,
"grad_norm": 0.1973586040294035,
"learning_rate": 2.6787227391654025e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09772805124521255,
"step": 1640,
"valid_targets_mean": 8931.9,
"valid_targets_min": 410
},
{
"epoch": 2.262964662689307,
"grad_norm": 0.22153726074279795,
"learning_rate": 2.6696805295682487e-05,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13094830513000488,
"step": 1645,
"valid_targets_mean": 11522.8,
"valid_targets_min": 620
},
{
"epoch": 2.2698485543827442,
"grad_norm": 0.25466761523016024,
"learning_rate": 2.660622876479234e-05,
"loss": 0.3332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11351979523897171,
"step": 1650,
"valid_targets_mean": 6154.2,
"valid_targets_min": 386
},
{
"epoch": 2.2767324460761817,
"grad_norm": 0.2803967972978861,
"learning_rate": 2.6515499887767495e-05,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11425979435443878,
"step": 1655,
"valid_targets_mean": 6070.9,
"valid_targets_min": 2967
},
{
"epoch": 2.2836163377696193,
"grad_norm": 1.6466553952943501,
"learning_rate": 2.642462075690511e-05,
"loss": 0.6025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20921450853347778,
"step": 1660,
"valid_targets_mean": 3383.0,
"valid_targets_min": 1270
},
{
"epoch": 2.2905002294630563,
"grad_norm": 0.6287251863877925,
"learning_rate": 2.633359346796736e-05,
"loss": 0.6721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16572773456573486,
"step": 1665,
"valid_targets_mean": 2937.2,
"valid_targets_min": 1026
},
{
"epoch": 2.297384121156494,
"grad_norm": 0.49928140036251006,
"learning_rate": 2.6242420120133086e-05,
"loss": 0.6071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.290330171585083,
"step": 1670,
"valid_targets_mean": 4071.6,
"valid_targets_min": 1539
},
{
"epoch": 2.3042680128499313,
"grad_norm": 0.38142909127873137,
"learning_rate": 2.615110281594938e-05,
"loss": 0.59,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19661152362823486,
"step": 1675,
"valid_targets_mean": 5239.0,
"valid_targets_min": 1739
},
{
"epoch": 2.3111519045433684,
"grad_norm": 0.3099380229416545,
"learning_rate": 2.6059643661283116e-05,
"loss": 0.5761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17346453666687012,
"step": 1680,
"valid_targets_mean": 4039.2,
"valid_targets_min": 1204
},
{
"epoch": 2.318035796236806,
"grad_norm": 0.30542809625015865,
"learning_rate": 2.5968044765272394e-05,
"loss": 0.5542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1582844853401184,
"step": 1685,
"valid_targets_mean": 3473.9,
"valid_targets_min": 1130
},
{
"epoch": 2.3249196879302434,
"grad_norm": 0.3051234978697733,
"learning_rate": 2.5876308240277857e-05,
"loss": 0.561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16743376851081848,
"step": 1690,
"valid_targets_mean": 3420.7,
"valid_targets_min": 891
},
{
"epoch": 2.3318035796236805,
"grad_norm": 0.3250560787056461,
"learning_rate": 2.578443620183403e-05,
"loss": 0.5461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24719908833503723,
"step": 1695,
"valid_targets_mean": 3772.6,
"valid_targets_min": 1497
},
{
"epoch": 2.338687471317118,
"grad_norm": 0.2660151177567861,
"learning_rate": 2.5692430768600512e-05,
"loss": 0.54,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17158254981040955,
"step": 1700,
"valid_targets_mean": 4168.5,
"valid_targets_min": 972
},
{
"epoch": 2.3455713630105555,
"grad_norm": 0.25544944955250865,
"learning_rate": 2.5600294062313103e-05,
"loss": 0.5428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1272633671760559,
"step": 1705,
"valid_targets_mean": 3252.4,
"valid_targets_min": 636
},
{
"epoch": 2.3524552547039925,
"grad_norm": 0.26750917864344126,
"learning_rate": 2.55080282077349e-05,
"loss": 0.5336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2098875492811203,
"step": 1710,
"valid_targets_mean": 4318.8,
"valid_targets_min": 1103
},
{
"epoch": 2.35933914639743,
"grad_norm": 0.26536069162137604,
"learning_rate": 2.5415635332607284e-05,
"loss": 0.5449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15961642563343048,
"step": 1715,
"valid_targets_mean": 3735.0,
"valid_targets_min": 1048
},
{
"epoch": 2.3662230380908675,
"grad_norm": 0.27381817984219636,
"learning_rate": 2.5323117567600845e-05,
"loss": 0.5188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22347742319107056,
"step": 1720,
"valid_targets_mean": 4098.8,
"valid_targets_min": 1319
},
{
"epoch": 2.3731069297843046,
"grad_norm": 0.2572874712994384,
"learning_rate": 2.523047704626628e-05,
"loss": 0.5298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16295018792152405,
"step": 1725,
"valid_targets_mean": 4343.0,
"valid_targets_min": 1454
},
{
"epoch": 2.379990821477742,
"grad_norm": 0.2724707677172288,
"learning_rate": 2.513771590498514e-05,
"loss": 0.5431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16079822182655334,
"step": 1730,
"valid_targets_mean": 3758.9,
"valid_targets_min": 1151
},
{
"epoch": 2.3868747131711796,
"grad_norm": 0.27991161433019873,
"learning_rate": 2.504483628292061e-05,
"loss": 0.5578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15567082166671753,
"step": 1735,
"valid_targets_mean": 3194.6,
"valid_targets_min": 994
},
{
"epoch": 2.3937586048646167,
"grad_norm": 0.2632081621333093,
"learning_rate": 2.4951840321968157e-05,
"loss": 0.5505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1653202325105667,
"step": 1740,
"valid_targets_mean": 3790.3,
"valid_targets_min": 1391
},
{
"epoch": 2.400642496558054,
"grad_norm": 0.27239266163390957,
"learning_rate": 2.4858730166706125e-05,
"loss": 0.5337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22418425977230072,
"step": 1745,
"valid_targets_mean": 4685.3,
"valid_targets_min": 822
},
{
"epoch": 2.4075263882514917,
"grad_norm": 0.2587574171184569,
"learning_rate": 2.47655079643463e-05,
"loss": 0.5376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14405536651611328,
"step": 1750,
"valid_targets_mean": 3750.0,
"valid_targets_min": 1314
},
{
"epoch": 2.4144102799449287,
"grad_norm": 0.2631506572474716,
"learning_rate": 2.467217586468438e-05,
"loss": 0.5434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17319154739379883,
"step": 1755,
"valid_targets_mean": 4435.8,
"valid_targets_min": 901
},
{
"epoch": 2.4212941716383662,
"grad_norm": 0.3163059805630689,
"learning_rate": 2.4578736020050423e-05,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05564213544130325,
"step": 1760,
"valid_targets_mean": 5312.0,
"valid_targets_min": 2490
},
{
"epoch": 2.4281780633318037,
"grad_norm": 0.28503436007188904,
"learning_rate": 2.448519058525915e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05835745483636856,
"step": 1765,
"valid_targets_mean": 5549.4,
"valid_targets_min": 3000
},
{
"epoch": 2.435061955025241,
"grad_norm": 0.26157242926928764,
"learning_rate": 2.4391541717560333e-05,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04818875715136528,
"step": 1770,
"valid_targets_mean": 5357.1,
"valid_targets_min": 2787
},
{
"epoch": 2.4419458467186783,
"grad_norm": 0.2023497066739585,
"learning_rate": 2.4297791576588993e-05,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06049264594912529,
"step": 1775,
"valid_targets_mean": 5853.2,
"valid_targets_min": 1305
},
{
"epoch": 2.448829738412116,
"grad_norm": 0.20086856688434088,
"learning_rate": 2.4203942324315623e-05,
"loss": 0.1489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04810313135385513,
"step": 1780,
"valid_targets_mean": 5323.5,
"valid_targets_min": 2609
},
{
"epoch": 2.455713630105553,
"grad_norm": 0.17236295233420956,
"learning_rate": 2.4109996124996297e-05,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05059269070625305,
"step": 1785,
"valid_targets_mean": 5320.9,
"valid_targets_min": 3076
},
{
"epoch": 2.4625975217989904,
"grad_norm": 0.18260197196728628,
"learning_rate": 2.4015955145122807e-05,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04599791020154953,
"step": 1790,
"valid_targets_mean": 5294.3,
"valid_targets_min": 1502
},
{
"epoch": 2.469481413492428,
"grad_norm": 0.20512227541440275,
"learning_rate": 2.3921821553372668e-05,
"loss": 0.1503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05129881948232651,
"step": 1795,
"valid_targets_mean": 5738.7,
"valid_targets_min": 3508
},
{
"epoch": 2.476365305185865,
"grad_norm": 0.19867031260793397,
"learning_rate": 2.3827597520559114e-05,
"loss": 0.1524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04662464186549187,
"step": 1800,
"valid_targets_mean": 5052.5,
"valid_targets_min": 2487
},
{
"epoch": 2.4832491968793025,
"grad_norm": 0.18169951666122502,
"learning_rate": 2.3733285219581044e-05,
"loss": 0.1423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04784727469086647,
"step": 1805,
"valid_targets_mean": 5108.5,
"valid_targets_min": 3236
},
{
"epoch": 2.49013308857274,
"grad_norm": 0.1804382758900024,
"learning_rate": 2.3638886825372905e-05,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0475069135427475,
"step": 1810,
"valid_targets_mean": 5397.8,
"valid_targets_min": 2803
},
{
"epoch": 2.497016980266177,
"grad_norm": 0.20004059160223273,
"learning_rate": 2.3544404514854546e-05,
"loss": 0.1462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046164870262145996,
"step": 1815,
"valid_targets_mean": 5513.7,
"valid_targets_min": 2867
},
{
"epoch": 2.5039008719596145,
"grad_norm": 0.219326819094649,
"learning_rate": 2.3449840466880982e-05,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04952413961291313,
"step": 1820,
"valid_targets_mean": 5217.7,
"valid_targets_min": 2433
},
{
"epoch": 2.510784763653052,
"grad_norm": 0.20249255196335733,
"learning_rate": 2.3355196862192217e-05,
"loss": 0.1401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04487111419439316,
"step": 1825,
"valid_targets_mean": 5169.1,
"valid_targets_min": 2789
},
{
"epoch": 2.517668655346489,
"grad_norm": 0.17956302100157867,
"learning_rate": 2.3260475883362875e-05,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0479186587035656,
"step": 1830,
"valid_targets_mean": 5809.1,
"valid_targets_min": 2841
},
{
"epoch": 2.5245525470399266,
"grad_norm": 0.19201673260015767,
"learning_rate": 2.316567971475192e-05,
"loss": 0.1457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05057358741760254,
"step": 1835,
"valid_targets_mean": 5502.1,
"valid_targets_min": 2911
},
{
"epoch": 2.5314364387333637,
"grad_norm": 0.20471095297210237,
"learning_rate": 2.307081054245226e-05,
"loss": 0.1431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0484449602663517,
"step": 1840,
"valid_targets_mean": 5274.9,
"valid_targets_min": 2672
},
{
"epoch": 2.538320330426801,
"grad_norm": 0.18776851268143915,
"learning_rate": 2.2975870554240355e-05,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.046514444053173065,
"step": 1845,
"valid_targets_mean": 4966.8,
"valid_targets_min": 2931
},
{
"epoch": 2.5452042221202387,
"grad_norm": 0.2093548275865132,
"learning_rate": 2.2880861939525723e-05,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05320793390274048,
"step": 1850,
"valid_targets_mean": 5898.0,
"valid_targets_min": 3337
},
{
"epoch": 2.552088113813676,
"grad_norm": 0.21043193594542342,
"learning_rate": 2.2785786889300497e-05,
"loss": 0.1411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.048174209892749786,
"step": 1855,
"valid_targets_mean": 5214.2,
"valid_targets_min": 2978
},
{
"epoch": 2.5589720055071132,
"grad_norm": 0.2562077072298455,
"learning_rate": 2.2690647596088874e-05,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09924779087305069,
"step": 1860,
"valid_targets_mean": 3851.8,
"valid_targets_min": 887
},
{
"epoch": 2.5658558972005507,
"grad_norm": 0.2663250390364335,
"learning_rate": 2.2595446253896554e-05,
"loss": 0.474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1439560055732727,
"step": 1865,
"valid_targets_mean": 4596.2,
"valid_targets_min": 1143
},
{
"epoch": 2.572739788893988,
"grad_norm": 0.2688731135078293,
"learning_rate": 2.250018505816015e-05,
"loss": 0.4627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1430397629737854,
"step": 1870,
"valid_targets_mean": 4087.0,
"valid_targets_min": 1058
},
{
"epoch": 2.5796236805874253,
"grad_norm": 0.31694294040387333,
"learning_rate": 2.2404866205696557e-05,
"loss": 0.452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1368146389722824,
"step": 1875,
"valid_targets_mean": 3146.8,
"valid_targets_min": 960
},
{
"epoch": 2.586507572280863,
"grad_norm": 0.2939674070397036,
"learning_rate": 2.2309491894652285e-05,
"loss": 0.4504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16308170557022095,
"step": 1880,
"valid_targets_mean": 4243.4,
"valid_targets_min": 890
},
{
"epoch": 2.5933914639743003,
"grad_norm": 0.2277866326879019,
"learning_rate": 2.2214064324452785e-05,
"loss": 0.4171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11347027122974396,
"step": 1885,
"valid_targets_mean": 4787.6,
"valid_targets_min": 989
},
{
"epoch": 2.6002753556677374,
"grad_norm": 0.2719922355168564,
"learning_rate": 2.2118585695751712e-05,
"loss": 0.4561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19940060377120972,
"step": 1890,
"valid_targets_mean": 4654.7,
"valid_targets_min": 385
},
{
"epoch": 2.607159247361175,
"grad_norm": 0.31742422458381,
"learning_rate": 2.202305821038017e-05,
"loss": 0.423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1434064507484436,
"step": 1895,
"valid_targets_mean": 3702.7,
"valid_targets_min": 1391
},
{
"epoch": 2.614043139054612,
"grad_norm": 0.30176842670334525,
"learning_rate": 2.1927484071295965e-05,
"loss": 0.4208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1468219757080078,
"step": 1900,
"valid_targets_mean": 3575.6,
"valid_targets_min": 1115
},
{
"epoch": 2.6209270307480494,
"grad_norm": 0.24794596280960404,
"learning_rate": 2.1831865482532753e-05,
"loss": 0.4435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12187361717224121,
"step": 1905,
"valid_targets_mean": 3883.8,
"valid_targets_min": 1256
},
{
"epoch": 2.627810922441487,
"grad_norm": 0.2852241331128035,
"learning_rate": 2.173620464914929e-05,
"loss": 0.4286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12532787024974823,
"step": 1910,
"valid_targets_mean": 4064.0,
"valid_targets_min": 1346
},
{
"epoch": 2.6346948141349245,
"grad_norm": 0.31724825994333544,
"learning_rate": 2.1640503777178484e-05,
"loss": 0.4433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1480903923511505,
"step": 1915,
"valid_targets_mean": 3096.2,
"valid_targets_min": 695
},
{
"epoch": 2.6415787058283615,
"grad_norm": 0.26842526190523636,
"learning_rate": 2.154476507357661e-05,
"loss": 0.4216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14191970229148865,
"step": 1920,
"valid_targets_mean": 3573.1,
"valid_targets_min": 1272
},
{
"epoch": 2.648462597521799,
"grad_norm": 0.24591428355457226,
"learning_rate": 2.1448990746172353e-05,
"loss": 0.4188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1298634558916092,
"step": 1925,
"valid_targets_mean": 4696.2,
"valid_targets_min": 939
},
{
"epoch": 2.655346489215236,
"grad_norm": 0.2586924114853833,
"learning_rate": 2.1353183003615944e-05,
"loss": 0.4675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18989674746990204,
"step": 1930,
"valid_targets_mean": 4314.5,
"valid_targets_min": 1135
},
{
"epoch": 2.6622303809086736,
"grad_norm": 0.2824215367703712,
"learning_rate": 2.1257344055328163e-05,
"loss": 0.4233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14473338425159454,
"step": 1935,
"valid_targets_mean": 3551.0,
"valid_targets_min": 909
},
{
"epoch": 2.669114272602111,
"grad_norm": 0.281092812644092,
"learning_rate": 2.1161476111449466e-05,
"loss": 0.4524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14296843111515045,
"step": 1940,
"valid_targets_mean": 3728.1,
"valid_targets_min": 970
},
{
"epoch": 2.6759981642955486,
"grad_norm": 0.2633497596047535,
"learning_rate": 2.106558138278894e-05,
"loss": 0.4234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11898775398731232,
"step": 1945,
"valid_targets_mean": 3462.3,
"valid_targets_min": 1420
},
{
"epoch": 2.6828820559889857,
"grad_norm": 0.2627345443724075,
"learning_rate": 2.0969662080773387e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13881132006645203,
"step": 1950,
"valid_targets_mean": 4587.7,
"valid_targets_min": 1133
},
{
"epoch": 2.689765947682423,
"grad_norm": 0.26816569681245367,
"learning_rate": 2.0873720417396265e-05,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12991484999656677,
"step": 1955,
"valid_targets_mean": 3638.8,
"valid_targets_min": 1166
},
{
"epoch": 2.6966498393758602,
"grad_norm": 0.25549945448822214,
"learning_rate": 2.0777758605166733e-05,
"loss": 0.4463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14429476857185364,
"step": 1960,
"valid_targets_mean": 4151.9,
"valid_targets_min": 1404
},
{
"epoch": 2.7035337310692977,
"grad_norm": 0.2661070040391692,
"learning_rate": 2.0681778857058584e-05,
"loss": 0.4209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0850117951631546,
"step": 1965,
"valid_targets_mean": 1979.0,
"valid_targets_min": 506
},
{
"epoch": 2.7104176227627352,
"grad_norm": 0.20166001158860308,
"learning_rate": 2.0585783386459242e-05,
"loss": 0.3063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09919463843107224,
"step": 1970,
"valid_targets_mean": 6913.1,
"valid_targets_min": 817
},
{
"epoch": 2.7173015144561727,
"grad_norm": 0.21527235088365207,
"learning_rate": 2.0489774407118695e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09187182784080505,
"step": 1975,
"valid_targets_mean": 6177.3,
"valid_targets_min": 509
},
{
"epoch": 2.72418540614961,
"grad_norm": 0.19810833897696425,
"learning_rate": 2.039375413309847e-05,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0892031192779541,
"step": 1980,
"valid_targets_mean": 6737.9,
"valid_targets_min": 1241
},
{
"epoch": 2.7310692978430473,
"grad_norm": 0.19012384443935784,
"learning_rate": 2.0297724778720553e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09897127747535706,
"step": 1985,
"valid_targets_mean": 7625.8,
"valid_targets_min": 597
},
{
"epoch": 2.7379531895364844,
"grad_norm": 0.2465631293054896,
"learning_rate": 2.0201688558516324e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13522624969482422,
"step": 1990,
"valid_targets_mean": 6605.6,
"valid_targets_min": 335
},
{
"epoch": 2.744837081229922,
"grad_norm": 0.19684510076736875,
"learning_rate": 2.0105647687175507e-05,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08646862208843231,
"step": 1995,
"valid_targets_mean": 6378.9,
"valid_targets_min": 281
},
{
"epoch": 2.7517209729233594,
"grad_norm": 0.1893668038549979,
"learning_rate": 2.000960437949509e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07368569076061249,
"step": 2000,
"valid_targets_mean": 5468.6,
"valid_targets_min": 543
},
{
"epoch": 2.758604864616797,
"grad_norm": 0.16937118963601522,
"learning_rate": 1.991356085032823e-05,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08165471255779266,
"step": 2005,
"valid_targets_mean": 6290.5,
"valid_targets_min": 301
},
{
"epoch": 2.765488756310234,
"grad_norm": 0.17417345586661112,
"learning_rate": 1.9817519314533203e-05,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05768326669931412,
"step": 2010,
"valid_targets_mean": 4845.6,
"valid_targets_min": 401
},
{
"epoch": 2.7723726480036714,
"grad_norm": 0.18330526531977226,
"learning_rate": 1.9721481986922314e-05,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08753426373004913,
"step": 2015,
"valid_targets_mean": 6736.4,
"valid_targets_min": 134
},
{
"epoch": 2.7792565396971085,
"grad_norm": 0.174366139502485,
"learning_rate": 1.9625451082210815e-05,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09649921953678131,
"step": 2020,
"valid_targets_mean": 7333.2,
"valid_targets_min": 1427
},
{
"epoch": 2.786140431390546,
"grad_norm": 0.23761842585783033,
"learning_rate": 1.9529428814965855e-05,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052613697946071625,
"step": 2025,
"valid_targets_mean": 1272.8,
"valid_targets_min": 374
},
{
"epoch": 2.7930243230839835,
"grad_norm": 0.17619680289425318,
"learning_rate": 1.9433417399555385e-05,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08473365008831024,
"step": 2030,
"valid_targets_mean": 6596.2,
"valid_targets_min": 491
},
{
"epoch": 2.799908214777421,
"grad_norm": 0.17424767345113856,
"learning_rate": 1.93374190500971e-05,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06102645769715309,
"step": 2035,
"valid_targets_mean": 5984.0,
"valid_targets_min": 350
},
{
"epoch": 2.806792106470858,
"grad_norm": 0.19023496668990852,
"learning_rate": 1.924143598040738e-05,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09187609702348709,
"step": 2040,
"valid_targets_mean": 6808.1,
"valid_targets_min": 367
},
{
"epoch": 2.8136759981642956,
"grad_norm": 0.19414274218047128,
"learning_rate": 1.9145470403950246e-05,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09320957958698273,
"step": 2045,
"valid_targets_mean": 6776.0,
"valid_targets_min": 475
},
{
"epoch": 2.8205598898577326,
"grad_norm": 0.21805678499250258,
"learning_rate": 1.9049524533786306e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10997814685106277,
"step": 2050,
"valid_targets_mean": 7100.5,
"valid_targets_min": 370
},
{
"epoch": 2.82744378155117,
"grad_norm": 0.1923498241545188,
"learning_rate": 1.8953600582521733e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06720973551273346,
"step": 2055,
"valid_targets_mean": 5628.6,
"valid_targets_min": 503
},
{
"epoch": 2.8343276732446077,
"grad_norm": 0.1716392833907659,
"learning_rate": 1.8857700762257188e-05,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09128379821777344,
"step": 2060,
"valid_targets_mean": 6859.2,
"valid_targets_min": 578
},
{
"epoch": 2.841211564938045,
"grad_norm": 0.2612671468981132,
"learning_rate": 1.8761827284536894e-05,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07055749744176865,
"step": 2065,
"valid_targets_mean": 3765.6,
"valid_targets_min": 1393
},
{
"epoch": 2.8480954566314822,
"grad_norm": 0.26011044179693166,
"learning_rate": 1.8665982360297564e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0651964545249939,
"step": 2070,
"valid_targets_mean": 3591.2,
"valid_targets_min": 1507
},
{
"epoch": 2.8549793483249197,
"grad_norm": 0.2609222687498387,
"learning_rate": 1.8570168199817454e-05,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05844973772764206,
"step": 2075,
"valid_targets_mean": 3575.5,
"valid_targets_min": 533
},
{
"epoch": 2.861863240018357,
"grad_norm": 0.26962687587535233,
"learning_rate": 1.8474387012665357e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0727514773607254,
"step": 2080,
"valid_targets_mean": 3438.5,
"valid_targets_min": 426
},
{
"epoch": 2.8687471317117943,
"grad_norm": 0.2348996563907632,
"learning_rate": 1.8378641007649686e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.058854710310697556,
"step": 2085,
"valid_targets_mean": 3471.2,
"valid_targets_min": 440
},
{
"epoch": 2.875631023405232,
"grad_norm": 0.24990418831063008,
"learning_rate": 1.8282932392767516e-05,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06448241323232651,
"step": 2090,
"valid_targets_mean": 3325.1,
"valid_targets_min": 712
},
{
"epoch": 2.8825149150986693,
"grad_norm": 0.23030694879818017,
"learning_rate": 1.8187263375153664e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.060683317482471466,
"step": 2095,
"valid_targets_mean": 3658.6,
"valid_targets_min": 448
},
{
"epoch": 2.8893988067921064,
"grad_norm": 0.23232648155318278,
"learning_rate": 1.809163616102981e-05,
"loss": 0.1923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06554745137691498,
"step": 2100,
"valid_targets_mean": 3833.8,
"valid_targets_min": 418
},
{
"epoch": 2.896282698485544,
"grad_norm": 0.25730041564114836,
"learning_rate": 1.799605295565357e-05,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06680840253829956,
"step": 2105,
"valid_targets_mean": 3820.5,
"valid_targets_min": 434
},
{
"epoch": 2.903166590178981,
"grad_norm": 0.22753368510563451,
"learning_rate": 1.7900515963267708e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06230275332927704,
"step": 2110,
"valid_targets_mean": 3828.8,
"valid_targets_min": 707
},
{
"epoch": 2.9100504818724184,
"grad_norm": 0.23769119372061534,
"learning_rate": 1.7805027387049266e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.056608423590660095,
"step": 2115,
"valid_targets_mean": 3212.1,
"valid_targets_min": 402
},
{
"epoch": 2.916934373565856,
"grad_norm": 0.2446021340553814,
"learning_rate": 1.7709589429058756e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059441857039928436,
"step": 2120,
"valid_targets_mean": 3774.8,
"valid_targets_min": 390
},
{
"epoch": 2.9238182652592934,
"grad_norm": 0.23890540039137606,
"learning_rate": 1.761420429018937e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06359831988811493,
"step": 2125,
"valid_targets_mean": 3427.3,
"valid_targets_min": 269
},
{
"epoch": 2.9307021569527305,
"grad_norm": 0.23688083508729743,
"learning_rate": 1.7518874170116262e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06328218430280685,
"step": 2130,
"valid_targets_mean": 3810.5,
"valid_targets_min": 405
},
{
"epoch": 2.937586048646168,
"grad_norm": 0.24155127909279164,
"learning_rate": 1.742360126724579e-05,
"loss": 0.1925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06442797929048538,
"step": 2135,
"valid_targets_mean": 3882.4,
"valid_targets_min": 478
},
{
"epoch": 2.944469940339605,
"grad_norm": 0.3631819880378349,
"learning_rate": 1.732838777866483e-05,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09788917005062103,
"step": 2140,
"valid_targets_mean": 6992.9,
"valid_targets_min": 347
},
{
"epoch": 2.9513538320330426,
"grad_norm": 0.3172950606636833,
"learning_rate": 1.7233235900090094e-05,
"loss": 0.2511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08133139461278915,
"step": 2145,
"valid_targets_mean": 6991.2,
"valid_targets_min": 301
},
{
"epoch": 2.95823772372648,
"grad_norm": 0.25813777821116024,
"learning_rate": 1.7138147825817516e-05,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08661668747663498,
"step": 2150,
"valid_targets_mean": 7084.7,
"valid_targets_min": 231
},
{
"epoch": 2.9651216154199176,
"grad_norm": 0.2575657738469496,
"learning_rate": 1.7043125748671637e-05,
"loss": 0.2449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.087073914706707,
"step": 2155,
"valid_targets_mean": 7077.1,
"valid_targets_min": 3319
},
{
"epoch": 2.9720055071133546,
"grad_norm": 0.2259993012650762,
"learning_rate": 1.6948171859955054e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08060729503631592,
"step": 2160,
"valid_targets_mean": 6901.2,
"valid_targets_min": 421
},
{
"epoch": 2.978889398806792,
"grad_norm": 0.21460575181010538,
"learning_rate": 1.6853288349397842e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07245530188083649,
"step": 2165,
"valid_targets_mean": 6402.1,
"valid_targets_min": 331
},
{
"epoch": 2.985773290500229,
"grad_norm": 0.26274959327700337,
"learning_rate": 1.675847740510712e-05,
"loss": 0.2275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07267634570598602,
"step": 2170,
"valid_targets_mean": 6595.1,
"valid_targets_min": 111
},
{
"epoch": 2.9926571821936667,
"grad_norm": 0.20507915627157383,
"learning_rate": 1.666374121351652e-05,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07876935601234436,
"step": 2175,
"valid_targets_mean": 6902.3,
"valid_targets_min": 2196
},
{
"epoch": 2.9995410738871042,
"grad_norm": 0.2067208575198668,
"learning_rate": 1.6569081959335843e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0786517783999443,
"step": 2180,
"valid_targets_mean": 7013.4,
"valid_targets_min": 1068
},
{
"epoch": 3.0055071133547497,
"grad_norm": 1.47143463512981,
"learning_rate": 1.6474501825500617e-05,
"loss": 0.5678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17598947882652283,
"step": 2185,
"valid_targets_mean": 6954.8,
"valid_targets_min": 1761
},
{
"epoch": 3.0123910050481872,
"grad_norm": 0.8296001361456135,
"learning_rate": 1.6380002993121768e-05,
"loss": 0.4782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16915714740753174,
"step": 2190,
"valid_targets_mean": 8220.0,
"valid_targets_min": 2842
},
{
"epoch": 3.0192748967416247,
"grad_norm": 0.5343323686375032,
"learning_rate": 1.6285587641435347e-05,
"loss": 0.4252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12750446796417236,
"step": 2195,
"valid_targets_mean": 7166.5,
"valid_targets_min": 2501
},
{
"epoch": 3.026158788435062,
"grad_norm": 0.3998460344540367,
"learning_rate": 1.6191257947752254e-05,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12517595291137695,
"step": 2200,
"valid_targets_mean": 6987.4,
"valid_targets_min": 1709
},
{
"epoch": 3.0330426801284993,
"grad_norm": 0.2685805910516251,
"learning_rate": 1.609701608740803e-05,
"loss": 0.3665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12631681561470032,
"step": 2205,
"valid_targets_mean": 7609.8,
"valid_targets_min": 2002
},
{
"epoch": 3.039926571821937,
"grad_norm": 0.24262874044823118,
"learning_rate": 1.6002864233712684e-05,
"loss": 0.3682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11692699790000916,
"step": 2210,
"valid_targets_mean": 7067.3,
"valid_targets_min": 2449
},
{
"epoch": 3.046810463515374,
"grad_norm": 0.23285762855561765,
"learning_rate": 1.5908804557900595e-05,
"loss": 0.3565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10911443829536438,
"step": 2215,
"valid_targets_mean": 7091.4,
"valid_targets_min": 2861
},
{
"epoch": 3.0536943552088114,
"grad_norm": 0.20546076130954244,
"learning_rate": 1.581483922908043e-05,
"loss": 0.3451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1265745759010315,
"step": 2220,
"valid_targets_mean": 7742.7,
"valid_targets_min": 341
},
{
"epoch": 3.060578246902249,
"grad_norm": 0.22268477828232294,
"learning_rate": 1.572097041418512e-05,
"loss": 0.3502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1311422437429428,
"step": 2225,
"valid_targets_mean": 8509.0,
"valid_targets_min": 3043
},
{
"epoch": 3.067462138595686,
"grad_norm": 0.22540249838886647,
"learning_rate": 1.562720027792188e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11340901255607605,
"step": 2230,
"valid_targets_mean": 6931.7,
"valid_targets_min": 2360
},
{
"epoch": 3.0743460302891235,
"grad_norm": 0.19718354585484277,
"learning_rate": 1.55335309827223e-05,
"loss": 0.3357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10545062273740768,
"step": 2235,
"valid_targets_mean": 9712.0,
"valid_targets_min": 2685
},
{
"epoch": 3.081229921982561,
"grad_norm": 0.18725111683861656,
"learning_rate": 1.5439964688692497e-05,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1086466908454895,
"step": 2240,
"valid_targets_mean": 9876.8,
"valid_targets_min": 387
},
{
"epoch": 3.088113813675998,
"grad_norm": 0.1845673546242831,
"learning_rate": 1.534650355356325e-05,
"loss": 0.3151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10268598794937134,
"step": 2245,
"valid_targets_mean": 9530.9,
"valid_targets_min": 5556
},
{
"epoch": 3.0949977053694355,
"grad_norm": 0.19522776849842052,
"learning_rate": 1.5253149732640305e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10937610268592834,
"step": 2250,
"valid_targets_mean": 9594.7,
"valid_targets_min": 4603
},
{
"epoch": 3.101881597062873,
"grad_norm": 0.18222363325054514,
"learning_rate": 1.515990537875459e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10362711548805237,
"step": 2255,
"valid_targets_mean": 9466.0,
"valid_targets_min": 6389
},
{
"epoch": 3.10876548875631,
"grad_norm": 0.18401641053290826,
"learning_rate": 1.5066772642212657e-05,
"loss": 0.3041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.102295882999897,
"step": 2260,
"valid_targets_mean": 9956.4,
"valid_targets_min": 4744
},
{
"epoch": 3.1156493804497476,
"grad_norm": 0.18509759714005736,
"learning_rate": 1.4973753670747033e-05,
"loss": 0.3109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10919614136219025,
"step": 2265,
"valid_targets_mean": 9960.5,
"valid_targets_min": 6172
},
{
"epoch": 3.122533272143185,
"grad_norm": 0.19550761601783884,
"learning_rate": 1.4880850609466726e-05,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10317480564117432,
"step": 2270,
"valid_targets_mean": 9848.8,
"valid_targets_min": 751
},
{
"epoch": 3.129417163836622,
"grad_norm": 0.18779537300856247,
"learning_rate": 1.478806560080771e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10043558478355408,
"step": 2275,
"valid_targets_mean": 9407.0,
"valid_targets_min": 2003
},
{
"epoch": 3.1363010555300597,
"grad_norm": 0.195833294224063,
"learning_rate": 1.469540078448358e-05,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10033436119556427,
"step": 2280,
"valid_targets_mean": 9471.5,
"valid_targets_min": 4297
},
{
"epoch": 3.143184947223497,
"grad_norm": 0.19526343486199585,
"learning_rate": 1.4602858297436164e-05,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10044103860855103,
"step": 2285,
"valid_targets_mean": 8577.6,
"valid_targets_min": 3933
},
{
"epoch": 3.1500688389169342,
"grad_norm": 0.19666326160932227,
"learning_rate": 1.451044027378627e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1077999621629715,
"step": 2290,
"valid_targets_mean": 9960.7,
"valid_targets_min": 1490
},
{
"epoch": 3.1569527306103717,
"grad_norm": 0.1827729428333937,
"learning_rate": 1.441814884478443e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09793984144926071,
"step": 2295,
"valid_targets_mean": 9948.3,
"valid_targets_min": 3344
},
{
"epoch": 3.1638366223038092,
"grad_norm": 0.18754922066894553,
"learning_rate": 1.4325986138761803e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0920855700969696,
"step": 2300,
"valid_targets_mean": 9342.2,
"valid_targets_min": 3715
},
{
"epoch": 3.1707205139972463,
"grad_norm": 0.17968909828736596,
"learning_rate": 1.4233954281081057e-05,
"loss": 0.3138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10528083145618439,
"step": 2305,
"valid_targets_mean": 9508.4,
"valid_targets_min": 434
},
{
"epoch": 3.177604405690684,
"grad_norm": 0.17574266851428197,
"learning_rate": 1.4142055394087386e-05,
"loss": 0.3072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09850088506937027,
"step": 2310,
"valid_targets_mean": 9982.4,
"valid_targets_min": 3744
},
{
"epoch": 3.1844882973841213,
"grad_norm": 0.18508025791924973,
"learning_rate": 1.4050291597059529e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10291430354118347,
"step": 2315,
"valid_targets_mean": 9832.3,
"valid_targets_min": 5100
},
{
"epoch": 3.1913721890775584,
"grad_norm": 0.1792881281784299,
"learning_rate": 1.3958665006160921e-05,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10465849936008453,
"step": 2320,
"valid_targets_mean": 10835.8,
"valid_targets_min": 2829
},
{
"epoch": 3.198256080770996,
"grad_norm": 0.20216865453090171,
"learning_rate": 1.3867177734390895e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09900674223899841,
"step": 2325,
"valid_targets_mean": 10256.2,
"valid_targets_min": 5379
},
{
"epoch": 3.2051399724644334,
"grad_norm": 0.1945776010645318,
"learning_rate": 1.3775831891535947e-05,
"loss": 0.3025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08786694705486298,
"step": 2330,
"valid_targets_mean": 9251.9,
"valid_targets_min": 648
},
{
"epoch": 3.2120238641578704,
"grad_norm": 0.24172818869279109,
"learning_rate": 1.368462958412109e-05,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10653791576623917,
"step": 2335,
"valid_targets_mean": 11007.1,
"valid_targets_min": 1456
},
{
"epoch": 3.218907755851308,
"grad_norm": 0.1898036433710197,
"learning_rate": 1.3593572915361243e-05,
"loss": 0.3049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10172994434833527,
"step": 2340,
"valid_targets_mean": 9657.8,
"valid_targets_min": 2733
},
{
"epoch": 3.2257916475447455,
"grad_norm": 0.19332251447397075,
"learning_rate": 1.3502663985112788e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12016477435827255,
"step": 2345,
"valid_targets_mean": 10753.2,
"valid_targets_min": 5581
},
{
"epoch": 3.2326755392381825,
"grad_norm": 0.21510799857850824,
"learning_rate": 1.3411904889825084e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10003630071878433,
"step": 2350,
"valid_targets_mean": 9586.8,
"valid_targets_min": 3841
},
{
"epoch": 3.23955943093162,
"grad_norm": 0.18385705814635578,
"learning_rate": 1.3321297722492167e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09207296371459961,
"step": 2355,
"valid_targets_mean": 9004.5,
"valid_targets_min": 434
},
{
"epoch": 3.2464433226250575,
"grad_norm": 0.187556404915227,
"learning_rate": 1.323084457260445e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08947405964136124,
"step": 2360,
"valid_targets_mean": 9294.9,
"valid_targets_min": 4130
},
{
"epoch": 3.2533272143184946,
"grad_norm": 0.2005331130468604,
"learning_rate": 1.3140547526100562e-05,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1010352075099945,
"step": 2365,
"valid_targets_mean": 10179.0,
"valid_targets_min": 4267
},
{
"epoch": 3.260211106011932,
"grad_norm": 0.1968597743990302,
"learning_rate": 1.3050408665319237e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08902589976787567,
"step": 2370,
"valid_targets_mean": 8532.7,
"valid_targets_min": 417
},
{
"epoch": 3.2670949977053696,
"grad_norm": 0.25214344550494583,
"learning_rate": 1.2960430068951288e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11159469187259674,
"step": 2375,
"valid_targets_mean": 6747.5,
"valid_targets_min": 401
},
{
"epoch": 3.2739788893988067,
"grad_norm": 0.25887393760787125,
"learning_rate": 1.2870613811991657e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10041764378547668,
"step": 2380,
"valid_targets_mean": 5423.5,
"valid_targets_min": 369
},
{
"epoch": 3.280862781092244,
"grad_norm": 2.2198067200851077,
"learning_rate": 1.2780961965691603e-05,
"loss": 0.4073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2686154842376709,
"step": 2385,
"valid_targets_mean": 3791.8,
"valid_targets_min": 1231
},
{
"epoch": 3.2877466727856817,
"grad_norm": 0.9924225603619974,
"learning_rate": 1.2691476597510898e-05,
"loss": 0.6873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2092369794845581,
"step": 2390,
"valid_targets_mean": 4159.7,
"valid_targets_min": 1267
},
{
"epoch": 3.2946305644791187,
"grad_norm": 0.5742567377325489,
"learning_rate": 1.2602159771070178e-05,
"loss": 0.6139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18377545475959778,
"step": 2395,
"valid_targets_mean": 3654.0,
"valid_targets_min": 1421
},
{
"epoch": 3.3015144561725562,
"grad_norm": 0.5576756466527528,
"learning_rate": 1.2513013546103335e-05,
"loss": 0.5911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16704589128494263,
"step": 2400,
"valid_targets_mean": 2945.1,
"valid_targets_min": 996
},
{
"epoch": 3.3083983478659937,
"grad_norm": 0.3074568996613724,
"learning_rate": 1.2424039978410005e-05,
"loss": 0.5589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1972390115261078,
"step": 2405,
"valid_targets_mean": 4179.1,
"valid_targets_min": 1183
},
{
"epoch": 3.315282239559431,
"grad_norm": 0.3032569694533608,
"learning_rate": 1.2335241119808203e-05,
"loss": 0.5219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1691218614578247,
"step": 2410,
"valid_targets_mean": 4048.5,
"valid_targets_min": 1297
},
{
"epoch": 3.3221661312528683,
"grad_norm": 0.2765510565360534,
"learning_rate": 1.2246619018086973e-05,
"loss": 0.511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16525253653526306,
"step": 2415,
"valid_targets_mean": 4272.8,
"valid_targets_min": 1187
},
{
"epoch": 3.329050022946306,
"grad_norm": 0.27395286901316585,
"learning_rate": 1.2158175716959178e-05,
"loss": 0.5239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2498304396867752,
"step": 2420,
"valid_targets_mean": 4842.6,
"valid_targets_min": 1298
},
{
"epoch": 3.335933914639743,
"grad_norm": 0.29231799803753794,
"learning_rate": 1.2069913256014336e-05,
"loss": 0.5106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.200586199760437,
"step": 2425,
"valid_targets_mean": 4255.8,
"valid_targets_min": 1314
},
{
"epoch": 3.3428178063331804,
"grad_norm": 0.27263355288284863,
"learning_rate": 1.1981833670671641e-05,
"loss": 0.5095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15810373425483704,
"step": 2430,
"valid_targets_mean": 4050.4,
"valid_targets_min": 1624
},
{
"epoch": 3.349701698026618,
"grad_norm": 0.2836133175960233,
"learning_rate": 1.1893938992132983e-05,
"loss": 0.4842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15525907278060913,
"step": 2435,
"valid_targets_mean": 3251.1,
"valid_targets_min": 1018
},
{
"epoch": 3.356585589720055,
"grad_norm": 0.26401709501959203,
"learning_rate": 1.1806231247336135e-05,
"loss": 0.4978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16985741257667542,
"step": 2440,
"valid_targets_mean": 3961.1,
"valid_targets_min": 1033
},
{
"epoch": 3.3634694814134924,
"grad_norm": 0.23776953582310714,
"learning_rate": 1.1718712458907961e-05,
"loss": 0.4965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18274521827697754,
"step": 2445,
"valid_targets_mean": 5018.0,
"valid_targets_min": 1101
},
{
"epoch": 3.37035337310693,
"grad_norm": 0.2640952890965296,
"learning_rate": 1.1631384645117831e-05,
"loss": 0.496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1817808896303177,
"step": 2450,
"valid_targets_mean": 4231.1,
"valid_targets_min": 1310
},
{
"epoch": 3.377237264800367,
"grad_norm": 0.28342473701431786,
"learning_rate": 1.154424981983106e-05,
"loss": 0.4972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1519908607006073,
"step": 2455,
"valid_targets_mean": 3704.2,
"valid_targets_min": 1093
},
{
"epoch": 3.3841211564938045,
"grad_norm": 0.2951557771645841,
"learning_rate": 1.1457309992462434e-05,
"loss": 0.5127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16076089441776276,
"step": 2460,
"valid_targets_mean": 3797.5,
"valid_targets_min": 1323
},
{
"epoch": 3.391005048187242,
"grad_norm": 0.2824279828368872,
"learning_rate": 1.1370567167929907e-05,
"loss": 0.5128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16737669706344604,
"step": 2465,
"valid_targets_mean": 3499.0,
"valid_targets_min": 665
},
{
"epoch": 3.397888939880679,
"grad_norm": 0.24191641839490738,
"learning_rate": 1.1284023346608345e-05,
"loss": 0.499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1770470142364502,
"step": 2470,
"valid_targets_mean": 5092.9,
"valid_targets_min": 1149
},
{
"epoch": 3.4047728315741166,
"grad_norm": 0.25812009589666846,
"learning_rate": 1.1197680524283428e-05,
"loss": 0.5082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2065732181072235,
"step": 2475,
"valid_targets_mean": 4786.8,
"valid_targets_min": 1492
},
{
"epoch": 3.411656723267554,
"grad_norm": 0.2609107313315737,
"learning_rate": 1.111154069210557e-05,
"loss": 0.5111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.170506551861763,
"step": 2480,
"valid_targets_mean": 4219.8,
"valid_targets_min": 776
},
{
"epoch": 3.418540614960991,
"grad_norm": 0.4001514854422285,
"learning_rate": 1.1025605836544067e-05,
"loss": 0.3907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06078251823782921,
"step": 2485,
"valid_targets_mean": 5702.6,
"valid_targets_min": 2936
},
{
"epoch": 3.4254245066544287,
"grad_norm": 0.24598853218943317,
"learning_rate": 1.0939877939341206e-05,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05165702477097511,
"step": 2490,
"valid_targets_mean": 5383.9,
"valid_targets_min": 3193
},
{
"epoch": 3.432308398347866,
"grad_norm": 0.21842227235626044,
"learning_rate": 1.0854358977466664e-05,
"loss": 0.1416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045272137969732285,
"step": 2495,
"valid_targets_mean": 5404.5,
"valid_targets_min": 3254
},
{
"epoch": 3.4391922900413032,
"grad_norm": 0.19248978802990788,
"learning_rate": 1.0769050923071813e-05,
"loss": 0.1404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04644084721803665,
"step": 2500,
"valid_targets_mean": 5669.6,
"valid_targets_min": 2339
},
{
"epoch": 3.4460761817347407,
"grad_norm": 0.18077746801671077,
"learning_rate": 1.0683955743444348e-05,
"loss": 0.1308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045123808085918427,
"step": 2505,
"valid_targets_mean": 5712.7,
"valid_targets_min": 2963
},
{
"epoch": 3.4529600734281782,
"grad_norm": 0.20884570432769242,
"learning_rate": 1.0599075400962793e-05,
"loss": 0.1343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042846180498600006,
"step": 2510,
"valid_targets_mean": 5044.9,
"valid_targets_min": 2759
},
{
"epoch": 3.4598439651216153,
"grad_norm": 0.18635172677850229,
"learning_rate": 1.0514411853051381e-05,
"loss": 0.1294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03951629251241684,
"step": 2515,
"valid_targets_mean": 5219.8,
"valid_targets_min": 2654
},
{
"epoch": 3.466727856815053,
"grad_norm": 0.16818273843917325,
"learning_rate": 1.0429967052134801e-05,
"loss": 0.1345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042340002954006195,
"step": 2520,
"valid_targets_mean": 5413.7,
"valid_targets_min": 3427
},
{
"epoch": 3.4736117485084903,
"grad_norm": 0.18228194282838256,
"learning_rate": 1.0345742945593269e-05,
"loss": 0.133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0403037965297699,
"step": 2525,
"valid_targets_mean": 5462.3,
"valid_targets_min": 3458
},
{
"epoch": 3.4804956402019274,
"grad_norm": 0.17851242713475587,
"learning_rate": 1.026174147571751e-05,
"loss": 0.1274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044752124696969986,
"step": 2530,
"valid_targets_mean": 5651.2,
"valid_targets_min": 2078
},
{
"epoch": 3.487379531895365,
"grad_norm": 0.20049056795095394,
"learning_rate": 1.0177964579664085e-05,
"loss": 0.125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03916207700967789,
"step": 2535,
"valid_targets_mean": 5431.2,
"valid_targets_min": 1278
},
{
"epoch": 3.4942634235888024,
"grad_norm": 0.18270835516537468,
"learning_rate": 1.0094414189410625e-05,
"loss": 0.1306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04059268906712532,
"step": 2540,
"valid_targets_mean": 5013.1,
"valid_targets_min": 2521
},
{
"epoch": 3.5011473152822394,
"grad_norm": 0.20034351958133112,
"learning_rate": 1.0011092231711346e-05,
"loss": 0.1257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037493303418159485,
"step": 2545,
"valid_targets_mean": 5014.3,
"valid_targets_min": 2703
},
{
"epoch": 3.508031206975677,
"grad_norm": 0.17491191759515393,
"learning_rate": 9.928000628052552e-06,
"loss": 0.1248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0384521521627903,
"step": 2550,
"valid_targets_mean": 5006.2,
"valid_targets_min": 2670
},
{
"epoch": 3.514915098669114,
"grad_norm": 0.18654968465114588,
"learning_rate": 9.845141294608378e-06,
"loss": 0.1254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04389902949333191,
"step": 2555,
"valid_targets_mean": 6038.5,
"valid_targets_min": 3631
},
{
"epoch": 3.5217989903625515,
"grad_norm": 0.18761525640500146,
"learning_rate": 9.762516142196563e-06,
"loss": 0.1251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045166172087192535,
"step": 2560,
"valid_targets_mean": 4937.4,
"valid_targets_min": 2598
},
{
"epoch": 3.528682882055989,
"grad_norm": 0.1849921246703477,
"learning_rate": 9.680127076234425e-06,
"loss": 0.1245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04124714434146881,
"step": 2565,
"valid_targets_mean": 5467.6,
"valid_targets_min": 2990
},
{
"epoch": 3.5355667737494265,
"grad_norm": 0.18437113306824465,
"learning_rate": 9.597975996694872e-06,
"loss": 0.1276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04236382991075516,
"step": 2570,
"valid_targets_mean": 5111.8,
"valid_targets_min": 2044
},
{
"epoch": 3.5424506654428636,
"grad_norm": 0.18573334202464706,
"learning_rate": 9.516064798062625e-06,
"loss": 0.1275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04364463686943054,
"step": 2575,
"valid_targets_mean": 5763.9,
"valid_targets_min": 2904
},
{
"epoch": 3.549334557136301,
"grad_norm": 0.1915027801445681,
"learning_rate": 9.434395369290499e-06,
"loss": 0.124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0378815159201622,
"step": 2580,
"valid_targets_mean": 4922.0,
"valid_targets_min": 2500
},
{
"epoch": 3.556218448829738,
"grad_norm": 0.19162396288341896,
"learning_rate": 9.35296959375589e-06,
"loss": 0.1229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03863206505775452,
"step": 2585,
"valid_targets_mean": 5118.9,
"valid_targets_min": 2923
},
{
"epoch": 3.5631023405231756,
"grad_norm": 0.5191629748207883,
"learning_rate": 9.271789349217278e-06,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13411441445350647,
"step": 2590,
"valid_targets_mean": 3042.4,
"valid_targets_min": 1100
},
{
"epoch": 3.569986232216613,
"grad_norm": 0.3085051395779566,
"learning_rate": 9.190856507770965e-06,
"loss": 0.4481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1711662858724594,
"step": 2595,
"valid_targets_mean": 4385.5,
"valid_targets_min": 891
},
{
"epoch": 3.5768701239100507,
"grad_norm": 0.4307024372042649,
"learning_rate": 9.11017293580791e-06,
"loss": 0.4122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13990041613578796,
"step": 2600,
"valid_targets_mean": 1813.8,
"valid_targets_min": 507
},
{
"epoch": 3.5837540156034877,
"grad_norm": 0.2657723985016283,
"learning_rate": 9.02974049397066e-06,
"loss": 0.4207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12291470170021057,
"step": 2605,
"valid_targets_mean": 3846.0,
"valid_targets_min": 1237
},
{
"epoch": 3.5906379072969252,
"grad_norm": 0.2615169033048777,
"learning_rate": 8.949561037110441e-06,
"loss": 0.4125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1354140192270279,
"step": 2610,
"valid_targets_mean": 4735.8,
"valid_targets_min": 910
},
{
"epoch": 3.5975217989903623,
"grad_norm": 0.28820899087310153,
"learning_rate": 8.869636414244432e-06,
"loss": 0.4018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12852361798286438,
"step": 2615,
"valid_targets_mean": 3882.9,
"valid_targets_min": 1176
},
{
"epoch": 3.6044056906838,
"grad_norm": 0.2842744225252841,
"learning_rate": 8.789968468513057e-06,
"loss": 0.4022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16103368997573853,
"step": 2620,
"valid_targets_mean": 4241.8,
"valid_targets_min": 1013
},
{
"epoch": 3.6112895823772373,
"grad_norm": 0.23028309888693424,
"learning_rate": 8.710559037137516e-06,
"loss": 0.3805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11136943101882935,
"step": 2625,
"valid_targets_mean": 4934.8,
"valid_targets_min": 1378
},
{
"epoch": 3.618173474070675,
"grad_norm": 0.27031546941287016,
"learning_rate": 8.631409951377442e-06,
"loss": 0.4201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14648756384849548,
"step": 2630,
"valid_targets_mean": 3635.7,
"valid_targets_min": 1162
},
{
"epoch": 3.625057365764112,
"grad_norm": 0.261440214703691,
"learning_rate": 8.552523036488605e-06,
"loss": 0.3955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11132633686065674,
"step": 2635,
"valid_targets_mean": 3513.8,
"valid_targets_min": 1441
},
{
"epoch": 3.6319412574575494,
"grad_norm": 0.34750801613748267,
"learning_rate": 8.47390011168088e-06,
"loss": 0.4035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25909337401390076,
"step": 2640,
"valid_targets_mean": 4413.0,
"valid_targets_min": 1233
},
{
"epoch": 3.6388251491509864,
"grad_norm": 0.25770762746792886,
"learning_rate": 8.395542990076256e-06,
"loss": 0.3975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10192108154296875,
"step": 2645,
"valid_targets_mean": 3737.7,
"valid_targets_min": 1650
},
{
"epoch": 3.645709040844424,
"grad_norm": 0.2420881480617191,
"learning_rate": 8.317453478667061e-06,
"loss": 0.3917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10463223606348038,
"step": 2650,
"valid_targets_mean": 3766.6,
"valid_targets_min": 1250
},
{
"epoch": 3.6525929325378614,
"grad_norm": 0.26662498322339967,
"learning_rate": 8.239633378274249e-06,
"loss": 0.4106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12207278609275818,
"step": 2655,
"valid_targets_mean": 3043.5,
"valid_targets_min": 1208
},
{
"epoch": 3.659476824231299,
"grad_norm": 0.2508023395017142,
"learning_rate": 8.162084483505892e-06,
"loss": 0.4167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14572551846504211,
"step": 2660,
"valid_targets_mean": 4615.1,
"valid_targets_min": 269
},
{
"epoch": 3.666360715924736,
"grad_norm": 0.23556631300518252,
"learning_rate": 8.084808582715795e-06,
"loss": 0.3892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1286328136920929,
"step": 2665,
"valid_targets_mean": 5172.2,
"valid_targets_min": 1589
},
{
"epoch": 3.6732446076181735,
"grad_norm": 0.26361055666988087,
"learning_rate": 8.007807457962272e-06,
"loss": 0.414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15162985026836395,
"step": 2670,
"valid_targets_mean": 4159.3,
"valid_targets_min": 1283
},
{
"epoch": 3.6801284993116106,
"grad_norm": 0.25764341984499367,
"learning_rate": 7.931082884966996e-06,
"loss": 0.402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14428415894508362,
"step": 2675,
"valid_targets_mean": 4058.6,
"valid_targets_min": 876
},
{
"epoch": 3.687012391005048,
"grad_norm": 0.2722663989969839,
"learning_rate": 7.854636633074128e-06,
"loss": 0.3874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17224925756454468,
"step": 2680,
"valid_targets_mean": 4401.0,
"valid_targets_min": 1349
},
{
"epoch": 3.6938962826984856,
"grad_norm": 0.25427623016618217,
"learning_rate": 7.778470465209417e-06,
"loss": 0.408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11766083538532257,
"step": 2685,
"valid_targets_mean": 3505.7,
"valid_targets_min": 809
},
{
"epoch": 3.700780174391923,
"grad_norm": 0.24889480025272662,
"learning_rate": 7.702586137839653e-06,
"loss": 0.4076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10833757370710373,
"step": 2690,
"valid_targets_mean": 3860.3,
"valid_targets_min": 602
},
{
"epoch": 3.70766406608536,
"grad_norm": 0.3707403029896572,
"learning_rate": 7.626985400932068e-06,
"loss": 0.3428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10806169360876083,
"step": 2695,
"valid_targets_mean": 8001.6,
"valid_targets_min": 1252
},
{
"epoch": 3.7145479577787976,
"grad_norm": 0.19669483141062702,
"learning_rate": 7.551669997914048e-06,
"loss": 0.2464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07481403648853302,
"step": 2700,
"valid_targets_mean": 6021.0,
"valid_targets_min": 389
},
{
"epoch": 3.7214318494722347,
"grad_norm": 0.23162368514613632,
"learning_rate": 7.47664166563286e-06,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11998644471168518,
"step": 2705,
"valid_targets_mean": 6741.6,
"valid_targets_min": 473
},
{
"epoch": 3.728315741165672,
"grad_norm": 0.17228834530698153,
"learning_rate": 7.401902134315684e-06,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06548772752285004,
"step": 2710,
"valid_targets_mean": 5457.3,
"valid_targets_min": 253
},
{
"epoch": 3.7351996328591097,
"grad_norm": 0.17408247867794982,
"learning_rate": 7.3274531275296265e-06,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08035491406917572,
"step": 2715,
"valid_targets_mean": 6283.3,
"valid_targets_min": 146
},
{
"epoch": 3.7420835245525472,
"grad_norm": 0.17974994899581664,
"learning_rate": 7.253296362142048e-06,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07769985496997833,
"step": 2720,
"valid_targets_mean": 6143.3,
"valid_targets_min": 233
},
{
"epoch": 3.7489674162459843,
"grad_norm": 0.1675477236149244,
"learning_rate": 7.179433548280892e-06,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06394631415605545,
"step": 2725,
"valid_targets_mean": 6087.1,
"valid_targets_min": 1118
},
{
"epoch": 3.755851307939422,
"grad_norm": 0.1733213132187292,
"learning_rate": 7.105866389295335e-06,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07828719168901443,
"step": 2730,
"valid_targets_mean": 6520.0,
"valid_targets_min": 178
},
{
"epoch": 3.762735199632859,
"grad_norm": 0.1785269252204138,
"learning_rate": 7.032596581716422e-06,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08230659365653992,
"step": 2735,
"valid_targets_mean": 6715.5,
"valid_targets_min": 744
},
{
"epoch": 3.7696190913262964,
"grad_norm": 0.21946429665501535,
"learning_rate": 6.959625815218018e-06,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.045567117631435394,
"step": 2740,
"valid_targets_mean": 1099.6,
"valid_targets_min": 316
},
{
"epoch": 3.776502983019734,
"grad_norm": 0.17397920116832125,
"learning_rate": 6.8869557725777836e-06,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05601717159152031,
"step": 2745,
"valid_targets_mean": 5019.2,
"valid_targets_min": 247
},
{
"epoch": 3.7833868747131714,
"grad_norm": 0.16751761187770453,
"learning_rate": 6.814588129638393e-06,
"loss": 0.2496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09275075793266296,
"step": 2750,
"valid_targets_mean": 7409.7,
"valid_targets_min": 1034
},
{
"epoch": 3.7902707664066084,
"grad_norm": 0.17280417479859242,
"learning_rate": 6.742524555268886e-06,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05152815580368042,
"step": 2755,
"valid_targets_mean": 4764.1,
"valid_targets_min": 243
},
{
"epoch": 3.797154658100046,
"grad_norm": 0.16496609026025888,
"learning_rate": 6.6707667113261956e-06,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08169304579496384,
"step": 2760,
"valid_targets_mean": 6958.2,
"valid_targets_min": 1080
},
{
"epoch": 3.804038549793483,
"grad_norm": 0.19327664164399166,
"learning_rate": 6.599316252616796e-06,
"loss": 0.2431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13077764213085175,
"step": 2765,
"valid_targets_mean": 7221.4,
"valid_targets_min": 405
},
{
"epoch": 3.8109224414869205,
"grad_norm": 0.17470660816395175,
"learning_rate": 6.528174826858553e-06,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09528367966413498,
"step": 2770,
"valid_targets_mean": 7585.1,
"valid_targets_min": 1495
},
{
"epoch": 3.817806333180358,
"grad_norm": 0.18482290478544883,
"learning_rate": 6.457344074642751e-06,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10286924988031387,
"step": 2775,
"valid_targets_mean": 6407.4,
"valid_targets_min": 201
},
{
"epoch": 3.8246902248737955,
"grad_norm": 0.1666475205795951,
"learning_rate": 6.386825629396209e-06,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06370923668146133,
"step": 2780,
"valid_targets_mean": 6268.8,
"valid_targets_min": 536
},
{
"epoch": 3.8315741165672326,
"grad_norm": 0.1812248617883446,
"learning_rate": 6.316621117343657e-06,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1033419668674469,
"step": 2785,
"valid_targets_mean": 6778.3,
"valid_targets_min": 674
},
{
"epoch": 3.83845800826067,
"grad_norm": 0.3434779028623829,
"learning_rate": 6.246732157470205e-06,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.057458698749542236,
"step": 2790,
"valid_targets_mean": 3450.3,
"valid_targets_min": 449
},
{
"epoch": 3.845341899954107,
"grad_norm": 0.2506659571430072,
"learning_rate": 6.177160361484038e-06,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05707380175590515,
"step": 2795,
"valid_targets_mean": 3540.6,
"valid_targets_min": 443
},
{
"epoch": 3.8522257916475446,
"grad_norm": 0.25559819516599763,
"learning_rate": 6.107907333779204e-06,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0660262405872345,
"step": 2800,
"valid_targets_mean": 3877.7,
"valid_targets_min": 388
},
{
"epoch": 3.859109683340982,
"grad_norm": 0.23529237449017507,
"learning_rate": 6.038974671398678e-06,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06375281512737274,
"step": 2805,
"valid_targets_mean": 4024.9,
"valid_targets_min": 1736
},
{
"epoch": 3.8659935750344196,
"grad_norm": 0.2643384345756322,
"learning_rate": 5.970363963997443e-06,
"loss": 0.1787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0625511109828949,
"step": 2810,
"valid_targets_mean": 3796.8,
"valid_targets_min": 551
},
{
"epoch": 3.8728774667278567,
"grad_norm": 0.2630480400208193,
"learning_rate": 5.902076793805933e-06,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06277286261320114,
"step": 2815,
"valid_targets_mean": 4011.0,
"valid_targets_min": 423
},
{
"epoch": 3.879761358421294,
"grad_norm": 0.2836202603651868,
"learning_rate": 5.834114735593464e-06,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06746001541614532,
"step": 2820,
"valid_targets_mean": 4130.9,
"valid_targets_min": 1201
},
{
"epoch": 3.8866452501147313,
"grad_norm": 0.2443667600066765,
"learning_rate": 5.766479356631971e-06,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05533027648925781,
"step": 2825,
"valid_targets_mean": 3678.6,
"valid_targets_min": 538
},
{
"epoch": 3.893529141808169,
"grad_norm": 0.23675573830153043,
"learning_rate": 5.69917221665983e-06,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05468790978193283,
"step": 2830,
"valid_targets_mean": 3560.1,
"valid_targets_min": 475
},
{
"epoch": 3.9004130335016063,
"grad_norm": 0.2334249200769521,
"learning_rate": 5.632194867845906e-06,
"loss": 0.172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05852728337049484,
"step": 2835,
"valid_targets_mean": 3700.8,
"valid_targets_min": 1268
},
{
"epoch": 3.907296925195044,
"grad_norm": 0.24410413934950573,
"learning_rate": 5.5655488547537525e-06,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05753038823604584,
"step": 2840,
"valid_targets_mean": 3890.9,
"valid_targets_min": 1223
},
{
"epoch": 3.914180816888481,
"grad_norm": 0.24063324214163975,
"learning_rate": 5.499235714306013e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05531303212046623,
"step": 2845,
"valid_targets_mean": 3898.9,
"valid_targets_min": 1311
},
{
"epoch": 3.9210647085819184,
"grad_norm": 0.3744111376550879,
"learning_rate": 5.433256975748935e-06,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05198235064744949,
"step": 2850,
"valid_targets_mean": 3726.0,
"valid_targets_min": 452
},
{
"epoch": 3.9279486002753554,
"grad_norm": 0.23540898155652942,
"learning_rate": 5.367614160617147e-06,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.062141187489032745,
"step": 2855,
"valid_targets_mean": 3976.4,
"valid_targets_min": 496
},
{
"epoch": 3.934832491968793,
"grad_norm": 0.25445169989275357,
"learning_rate": 5.3023087826985395e-06,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05715780705213547,
"step": 2860,
"valid_targets_mean": 3581.7,
"valid_targets_min": 495
},
{
"epoch": 3.9417163836622304,
"grad_norm": 0.6096258105448606,
"learning_rate": 5.237342347999386e-06,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08614245802164078,
"step": 2865,
"valid_targets_mean": 6912.2,
"valid_targets_min": 1543
},
{
"epoch": 3.948600275355668,
"grad_norm": 0.36201237541972986,
"learning_rate": 5.1727163547095835e-06,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0755876824259758,
"step": 2870,
"valid_targets_mean": 6841.5,
"valid_targets_min": 453
},
{
"epoch": 3.955484167049105,
"grad_norm": 0.2473513142917225,
"learning_rate": 5.108432293168118e-06,
"loss": 0.2295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08236972987651825,
"step": 2875,
"valid_targets_mean": 7884.5,
"valid_targets_min": 924
},
{
"epoch": 3.9623680587425425,
"grad_norm": 0.254514479375607,
"learning_rate": 5.044491645828684e-06,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07513093948364258,
"step": 2880,
"valid_targets_mean": 6715.9,
"valid_targets_min": 367
},
{
"epoch": 3.9692519504359796,
"grad_norm": 0.24006908726730125,
"learning_rate": 4.980895887225529e-06,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05822212994098663,
"step": 2885,
"valid_targets_mean": 5647.7,
"valid_targets_min": 255
},
{
"epoch": 3.976135842129417,
"grad_norm": 0.2289050141214267,
"learning_rate": 4.917646483939405e-06,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.078819140791893,
"step": 2890,
"valid_targets_mean": 7380.5,
"valid_targets_min": 504
},
{
"epoch": 3.9830197338228546,
"grad_norm": 0.216564526739044,
"learning_rate": 4.85474489456379e-06,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06552626937627792,
"step": 2895,
"valid_targets_mean": 6277.5,
"valid_targets_min": 478
},
{
"epoch": 3.989903625516292,
"grad_norm": 0.1990891081128417,
"learning_rate": 4.792192569671202e-06,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06608976423740387,
"step": 2900,
"valid_targets_mean": 6117.1,
"valid_targets_min": 258
},
{
"epoch": 3.996787517209729,
"grad_norm": 0.1960679039089432,
"learning_rate": 4.7299909517798034e-06,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06078875809907913,
"step": 2905,
"valid_targets_mean": 5683.7,
"valid_targets_min": 364
},
{
"epoch": 4.002753556677375,
"grad_norm": 2.395952944498442,
"learning_rate": 4.668141475320096e-06,
"loss": 0.3927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16962723433971405,
"step": 2910,
"valid_targets_mean": 6370.5,
"valid_targets_min": 2089
},
{
"epoch": 4.009637448370812,
"grad_norm": 1.648670888994138,
"learning_rate": 4.6066455666018664e-06,
"loss": 0.5545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19499695301055908,
"step": 2915,
"valid_targets_mean": 7651.2,
"valid_targets_min": 2581
},
{
"epoch": 4.01652134006425,
"grad_norm": 0.9399053935552177,
"learning_rate": 4.5455046437812515e-06,
"loss": 0.4776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15764357149600983,
"step": 2920,
"valid_targets_mean": 7917.3,
"valid_targets_min": 2931
},
{
"epoch": 4.023405231757687,
"grad_norm": 0.6663207234555762,
"learning_rate": 4.4847201168280985e-06,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14368441700935364,
"step": 2925,
"valid_targets_mean": 7465.7,
"valid_targets_min": 1655
},
{
"epoch": 4.030289123451125,
"grad_norm": 0.5122623048638776,
"learning_rate": 4.42429338749339e-06,
"loss": 0.3812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11772125959396362,
"step": 2930,
"valid_targets_mean": 6986.5,
"valid_targets_min": 2745
},
{
"epoch": 4.037173015144562,
"grad_norm": 0.33779981131960823,
"learning_rate": 4.3642258492769685e-06,
"loss": 0.3676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10366019606590271,
"step": 2935,
"valid_targets_mean": 6226.8,
"valid_targets_min": 2078
},
{
"epoch": 4.044056906837999,
"grad_norm": 0.2703695467372586,
"learning_rate": 4.3045188873953506e-06,
"loss": 0.3527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10385061055421829,
"step": 2940,
"valid_targets_mean": 6504.0,
"valid_targets_min": 3466
},
{
"epoch": 4.050940798531436,
"grad_norm": 0.2448441853051352,
"learning_rate": 4.24517387874982e-06,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11456277221441269,
"step": 2945,
"valid_targets_mean": 7776.8,
"valid_targets_min": 2749
},
{
"epoch": 4.057824690224874,
"grad_norm": 0.21404234435367878,
"learning_rate": 4.186192191894656e-06,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09924231469631195,
"step": 2950,
"valid_targets_mean": 6354.8,
"valid_targets_min": 1941
},
{
"epoch": 4.064708581918311,
"grad_norm": 0.19782479723452737,
"learning_rate": 4.127575187005597e-06,
"loss": 0.3382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09340573847293854,
"step": 2955,
"valid_targets_mean": 6384.4,
"valid_targets_min": 2441
},
{
"epoch": 4.071592473611749,
"grad_norm": 0.19555802078655035,
"learning_rate": 4.069324215848438e-06,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11382173001766205,
"step": 2960,
"valid_targets_mean": 7465.9,
"valid_targets_min": 2228
},
{
"epoch": 4.078476365305185,
"grad_norm": 0.19204541810372228,
"learning_rate": 4.011440621747879e-06,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09361422061920166,
"step": 2965,
"valid_targets_mean": 8703.7,
"valid_targets_min": 4392
},
{
"epoch": 4.085360256998623,
"grad_norm": 0.17690580645771956,
"learning_rate": 3.953925739556556e-06,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09472465515136719,
"step": 2970,
"valid_targets_mean": 9525.9,
"valid_targets_min": 3807
},
{
"epoch": 4.09224414869206,
"grad_norm": 0.17538796102613904,
"learning_rate": 3.896780895624235e-06,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09817524254322052,
"step": 2975,
"valid_targets_mean": 8976.7,
"valid_targets_min": 2713
},
{
"epoch": 4.099128040385498,
"grad_norm": 0.16782987576999478,
"learning_rate": 3.840007407767235e-06,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.100134938955307,
"step": 2980,
"valid_targets_mean": 9808.0,
"valid_targets_min": 5333
},
{
"epoch": 4.1060119320789354,
"grad_norm": 0.16950335218205084,
"learning_rate": 3.7836065852380355e-06,
"loss": 0.2931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09137974679470062,
"step": 2985,
"valid_targets_mean": 8583.8,
"valid_targets_min": 2662
},
{
"epoch": 4.112895823772373,
"grad_norm": 0.1699684602922145,
"learning_rate": 3.727579728695103e-06,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09598828107118607,
"step": 2990,
"valid_targets_mean": 8976.7,
"valid_targets_min": 899
},
{
"epoch": 4.1197797154658105,
"grad_norm": 0.16269551372279134,
"learning_rate": 3.671928130172864e-06,
"loss": 0.3,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0977531224489212,
"step": 2995,
"valid_targets_mean": 8862.6,
"valid_targets_min": 363
},
{
"epoch": 4.126663607159247,
"grad_norm": 0.16710826243141283,
"learning_rate": 3.6166530730519413e-06,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09829722344875336,
"step": 3000,
"valid_targets_mean": 9068.4,
"valid_targets_min": 532
},
{
"epoch": 4.133547498852685,
"grad_norm": 0.15910196663534398,
"learning_rate": 3.561755832029519e-06,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10500204563140869,
"step": 3005,
"valid_targets_mean": 10089.5,
"valid_targets_min": 5419
},
{
"epoch": 4.140431390546122,
"grad_norm": 0.17704030770547838,
"learning_rate": 3.5072376730899937e-06,
"loss": 0.2919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09301409870386124,
"step": 3010,
"valid_targets_mean": 9003.8,
"valid_targets_min": 387
},
{
"epoch": 4.14731528223956,
"grad_norm": 0.1710309935861551,
"learning_rate": 3.453099853475739e-06,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10229654610157013,
"step": 3015,
"valid_targets_mean": 10012.9,
"valid_targets_min": 5197
},
{
"epoch": 4.154199173932997,
"grad_norm": 0.16458596144589727,
"learning_rate": 3.3993436216581556e-06,
"loss": 0.2931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09989041090011597,
"step": 3020,
"valid_targets_mean": 9826.7,
"valid_targets_min": 464
},
{
"epoch": 4.161083065626434,
"grad_norm": 0.1621123955498612,
"learning_rate": 3.3459702173088114e-06,
"loss": 0.2901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08722086995840073,
"step": 3025,
"valid_targets_mean": 8842.1,
"valid_targets_min": 4239
},
{
"epoch": 4.167966957319871,
"grad_norm": 0.1623556063331001,
"learning_rate": 3.2929808712709364e-06,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08920854330062866,
"step": 3030,
"valid_targets_mean": 9048.3,
"valid_targets_min": 5085
},
{
"epoch": 4.174850849013309,
"grad_norm": 0.15731886013609803,
"learning_rate": 3.2403768055309782e-06,
"loss": 0.2985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09582354873418808,
"step": 3035,
"valid_targets_mean": 9484.0,
"valid_targets_min": 4512
},
{
"epoch": 4.181734740706746,
"grad_norm": 0.15101610768604282,
"learning_rate": 3.1881592331904486e-06,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09862025827169418,
"step": 3040,
"valid_targets_mean": 9844.3,
"valid_targets_min": 3863
},
{
"epoch": 4.188618632400184,
"grad_norm": 0.15623253593056888,
"learning_rate": 3.136329358437937e-06,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08751824498176575,
"step": 3045,
"valid_targets_mean": 9963.1,
"valid_targets_min": 5225
},
{
"epoch": 4.195502524093621,
"grad_norm": 0.16134010073160548,
"learning_rate": 3.084888376521349e-06,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08784323185682297,
"step": 3050,
"valid_targets_mean": 9133.7,
"valid_targets_min": 2782
},
{
"epoch": 4.202386415787059,
"grad_norm": 0.16838974268135262,
"learning_rate": 3.033837473720329e-06,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10435424745082855,
"step": 3055,
"valid_targets_mean": 9841.2,
"valid_targets_min": 885
},
{
"epoch": 4.209270307480495,
"grad_norm": 0.16279332645708683,
"learning_rate": 2.9831778273189306e-06,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08671228587627411,
"step": 3060,
"valid_targets_mean": 9260.1,
"valid_targets_min": 378
},
{
"epoch": 4.216154199173933,
"grad_norm": 0.1825984338791435,
"learning_rate": 2.9329106055784364e-06,
"loss": 0.2929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09681597352027893,
"step": 3065,
"valid_targets_mean": 9212.2,
"valid_targets_min": 3467
},
{
"epoch": 4.22303809086737,
"grad_norm": 0.15677839672709085,
"learning_rate": 2.883036967710431e-06,
"loss": 0.2871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09850604832172394,
"step": 3070,
"valid_targets_mean": 10565.9,
"valid_targets_min": 723
},
{
"epoch": 4.229921982560808,
"grad_norm": 0.21256236658118818,
"learning_rate": 2.8335580638500703e-06,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09888806939125061,
"step": 3075,
"valid_targets_mean": 10235.8,
"valid_targets_min": 5141
},
{
"epoch": 4.236805874254245,
"grad_norm": 0.1652684573375055,
"learning_rate": 2.7844750350295635e-06,
"loss": 0.2839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10100476443767548,
"step": 3080,
"valid_targets_mean": 10594.5,
"valid_targets_min": 4701
},
{
"epoch": 4.243689765947682,
"grad_norm": 0.1713255908842138,
"learning_rate": 2.7357890131518395e-06,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08998183906078339,
"step": 3085,
"valid_targets_mean": 9161.7,
"valid_targets_min": 3022
},
{
"epoch": 4.2505736576411195,
"grad_norm": 0.16553307695173833,
"learning_rate": 2.6875011209644617e-06,
"loss": 0.2846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09085310250520706,
"step": 3090,
"valid_targets_mean": 9593.7,
"valid_targets_min": 5120
},
{
"epoch": 4.257457549334557,
"grad_norm": 0.17160681639906475,
"learning_rate": 2.639612472033726e-06,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08973085880279541,
"step": 3095,
"valid_targets_mean": 9896.2,
"valid_targets_min": 3759
},
{
"epoch": 4.2643414410279945,
"grad_norm": 0.16123604490750948,
"learning_rate": 2.592124170718999e-06,
"loss": 0.2871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09492038190364838,
"step": 3100,
"valid_targets_mean": 9676.5,
"valid_targets_min": 4171
},
{
"epoch": 4.271225332721432,
"grad_norm": 0.20844821277823775,
"learning_rate": 2.545037312147223e-06,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09212687611579895,
"step": 3105,
"valid_targets_mean": 6269.3,
"valid_targets_min": 470
},
{
"epoch": 4.2781092244148695,
"grad_norm": 0.2188431410916334,
"learning_rate": 2.4983529821876885e-06,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09872142970561981,
"step": 3110,
"valid_targets_mean": 6197.9,
"valid_targets_min": 350
},
{
"epoch": 4.284993116108307,
"grad_norm": 1.719226340993559,
"learning_rate": 2.4520722574269697e-06,
"loss": 0.6151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27690717577934265,
"step": 3115,
"valid_targets_mean": 5028.6,
"valid_targets_min": 935
},
{
"epoch": 4.291877007801744,
"grad_norm": 1.4178092966572517,
"learning_rate": 2.4061962051441113e-06,
"loss": 0.6474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19200366735458374,
"step": 3120,
"valid_targets_mean": 3933.0,
"valid_targets_min": 797
},
{
"epoch": 4.298760899495181,
"grad_norm": 0.987071906372295,
"learning_rate": 2.36072588328601e-06,
"loss": 0.6191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17249909043312073,
"step": 3125,
"valid_targets_mean": 3912.4,
"valid_targets_min": 1137
},
{
"epoch": 4.305644791188619,
"grad_norm": 0.6333455736156541,
"learning_rate": 2.31566234044303e-06,
"loss": 0.5633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1948523372411728,
"step": 3130,
"valid_targets_mean": 3427.5,
"valid_targets_min": 570
},
{
"epoch": 4.312528682882056,
"grad_norm": 0.41971667810569413,
"learning_rate": 2.2710066158248025e-06,
"loss": 0.5424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1517712026834488,
"step": 3135,
"valid_targets_mean": 4285.9,
"valid_targets_min": 1385
},
{
"epoch": 4.319412574575494,
"grad_norm": 0.3805804910200558,
"learning_rate": 2.226759739236262e-06,
"loss": 0.517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19778530299663544,
"step": 3140,
"valid_targets_mean": 4571.2,
"valid_targets_min": 1195
},
{
"epoch": 4.32629646626893,
"grad_norm": 0.3279172632768147,
"learning_rate": 2.1829227310539245e-06,
"loss": 0.5062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1429353952407837,
"step": 3145,
"valid_targets_mean": 3360.0,
"valid_targets_min": 791
},
{
"epoch": 4.333180357962368,
"grad_norm": 0.30812203887995343,
"learning_rate": 2.1394966022023246e-06,
"loss": 0.506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15199241042137146,
"step": 3150,
"valid_targets_mean": 3748.8,
"valid_targets_min": 1312
},
{
"epoch": 4.340064249655805,
"grad_norm": 0.2681054596093381,
"learning_rate": 2.0964823541307157e-06,
"loss": 0.4878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21830233931541443,
"step": 3155,
"valid_targets_mean": 4315.9,
"valid_targets_min": 858
},
{
"epoch": 4.346948141349243,
"grad_norm": 0.23204534962247023,
"learning_rate": 2.0538809787899728e-06,
"loss": 0.4748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1714772880077362,
"step": 3160,
"valid_targets_mean": 5165.7,
"valid_targets_min": 1332
},
{
"epoch": 4.35383203304268,
"grad_norm": 0.25226657135645386,
"learning_rate": 2.0116934586097294e-06,
"loss": 0.4778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14213097095489502,
"step": 3165,
"valid_targets_mean": 4124.3,
"valid_targets_min": 1668
},
{
"epoch": 4.360715924736118,
"grad_norm": 0.2715861692969419,
"learning_rate": 1.9699207664757057e-06,
"loss": 0.4836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16056758165359497,
"step": 3170,
"valid_targets_mean": 4181.1,
"valid_targets_min": 897
},
{
"epoch": 4.367599816429555,
"grad_norm": 0.2602540839903562,
"learning_rate": 1.928563865707278e-06,
"loss": 0.458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.137937992811203,
"step": 3175,
"valid_targets_mean": 3683.8,
"valid_targets_min": 1300
},
{
"epoch": 4.374483708122992,
"grad_norm": 0.2559875333171663,
"learning_rate": 1.88762371003526e-06,
"loss": 0.4951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24103213846683502,
"step": 3180,
"valid_targets_mean": 4964.7,
"valid_targets_min": 906
},
{
"epoch": 4.381367599816429,
"grad_norm": 0.2349098552726344,
"learning_rate": 1.8471012435799317e-06,
"loss": 0.4678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16132110357284546,
"step": 3185,
"valid_targets_mean": 4663.9,
"valid_targets_min": 1014
},
{
"epoch": 4.388251491509867,
"grad_norm": 0.2367676970278582,
"learning_rate": 1.8069974008292246e-06,
"loss": 0.5026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1740289032459259,
"step": 3190,
"valid_targets_mean": 5404.8,
"valid_targets_min": 1229
},
{
"epoch": 4.395135383203304,
"grad_norm": 0.2414666913515072,
"learning_rate": 1.7673131066172233e-06,
"loss": 0.4813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14912189543247223,
"step": 3195,
"valid_targets_mean": 4281.5,
"valid_targets_min": 1057
},
{
"epoch": 4.402019274896742,
"grad_norm": 0.2522485667461358,
"learning_rate": 1.7280492761027767e-06,
"loss": 0.4806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18337562680244446,
"step": 3200,
"valid_targets_mean": 4570.4,
"valid_targets_min": 1376
},
{
"epoch": 4.408903166590179,
"grad_norm": 0.2513303316228368,
"learning_rate": 1.6892068147484563e-06,
"loss": 0.4986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18488086760044098,
"step": 3205,
"valid_targets_mean": 4505.6,
"valid_targets_min": 1222
},
{
"epoch": 4.415787058283616,
"grad_norm": 0.22856795174321398,
"learning_rate": 1.650786618299629e-06,
"loss": 0.4708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13014987111091614,
"step": 3210,
"valid_targets_mean": 4379.0,
"valid_targets_min": 558
},
{
"epoch": 4.422670949977054,
"grad_norm": 0.4103495629302222,
"learning_rate": 1.6127895727638354e-06,
"loss": 0.1883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05053357779979706,
"step": 3215,
"valid_targets_mean": 5018.2,
"valid_targets_min": 2523
},
{
"epoch": 4.429554841670491,
"grad_norm": 0.26594803976153025,
"learning_rate": 1.5752165543903108e-06,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04512697458267212,
"step": 3220,
"valid_targets_mean": 5262.3,
"valid_targets_min": 2967
},
{
"epoch": 4.436438733363929,
"grad_norm": 0.2128042462301709,
"learning_rate": 1.5380684296498372e-06,
"loss": 0.1348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03946739807724953,
"step": 3225,
"valid_targets_mean": 5112.8,
"valid_targets_min": 3095
},
{
"epoch": 4.443322625057366,
"grad_norm": 0.19728120260756227,
"learning_rate": 1.5013460552147119e-06,
"loss": 0.1295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03898797184228897,
"step": 3230,
"valid_targets_mean": 5352.1,
"valid_targets_min": 2034
},
{
"epoch": 4.450206516750804,
"grad_norm": 0.18576983317859747,
"learning_rate": 1.4650502779390285e-06,
"loss": 0.1247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04268582910299301,
"step": 3235,
"valid_targets_mean": 5610.1,
"valid_targets_min": 3069
},
{
"epoch": 4.45709040844424,
"grad_norm": 0.1864794932574978,
"learning_rate": 1.4291819348391034e-06,
"loss": 0.1256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040051594376564026,
"step": 3240,
"valid_targets_mean": 5206.3,
"valid_targets_min": 3294
},
{
"epoch": 4.463974300137678,
"grad_norm": 0.17482555966140143,
"learning_rate": 1.3937418530742287e-06,
"loss": 0.1235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.042181774973869324,
"step": 3245,
"valid_targets_mean": 5573.9,
"valid_targets_min": 1997
},
{
"epoch": 4.470858191831115,
"grad_norm": 0.18070571117324402,
"learning_rate": 1.3587308499275475e-06,
"loss": 0.1269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.043698303401470184,
"step": 3250,
"valid_targets_mean": 5469.3,
"valid_targets_min": 3506
},
{
"epoch": 4.477742083524553,
"grad_norm": 0.1643633780132126,
"learning_rate": 1.3241497327872476e-06,
"loss": 0.1206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.040100231766700745,
"step": 3255,
"valid_targets_mean": 5436.2,
"valid_targets_min": 2886
},
{
"epoch": 4.48462597521799,
"grad_norm": 0.17207536132396473,
"learning_rate": 1.2899992991279086e-06,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.044177521020174026,
"step": 3260,
"valid_targets_mean": 5540.5,
"valid_targets_min": 3229
},
{
"epoch": 4.491509866911427,
"grad_norm": 0.16766746009169853,
"learning_rate": 1.2562803364921261e-06,
"loss": 0.1193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.041511788964271545,
"step": 3265,
"valid_targets_mean": 5831.1,
"valid_targets_min": 2745
},
{
"epoch": 4.498393758604864,
"grad_norm": 0.17030163346260857,
"learning_rate": 1.2229936224723483e-06,
"loss": 0.1191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03760635852813721,
"step": 3270,
"valid_targets_mean": 5347.5,
"valid_targets_min": 2417
},
{
"epoch": 4.505277650298302,
"grad_norm": 0.17085424627308554,
"learning_rate": 1.190139924692959e-06,
"loss": 0.1185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03664751350879669,
"step": 3275,
"valid_targets_mean": 5258.5,
"valid_targets_min": 720
},
{
"epoch": 4.512161541991739,
"grad_norm": 0.17522494699655267,
"learning_rate": 1.157720000792546e-06,
"loss": 0.1141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037477195262908936,
"step": 3280,
"valid_targets_mean": 5099.8,
"valid_targets_min": 1583
},
{
"epoch": 4.519045433685177,
"grad_norm": 0.17379587981619676,
"learning_rate": 1.125734598406447e-06,
"loss": 0.1148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04031280428171158,
"step": 3285,
"valid_targets_mean": 5578.4,
"valid_targets_min": 2798
},
{
"epoch": 4.525929325378614,
"grad_norm": 0.1695852085710305,
"learning_rate": 1.0941844551495162e-06,
"loss": 0.1159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03369366377592087,
"step": 3290,
"valid_targets_mean": 5036.6,
"valid_targets_min": 2310
},
{
"epoch": 4.532813217072052,
"grad_norm": 0.1786118550797064,
"learning_rate": 1.0630702985990914e-06,
"loss": 0.1169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03811822086572647,
"step": 3295,
"valid_targets_mean": 5270.8,
"valid_targets_min": 2978
},
{
"epoch": 4.5396971087654885,
"grad_norm": 0.16549826571880374,
"learning_rate": 1.0323928462782363e-06,
"loss": 0.116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.03811001777648926,
"step": 3300,
"valid_targets_mean": 5462.3,
"valid_targets_min": 2571
},
{
"epoch": 4.546581000458926,
"grad_norm": 0.16459854028246523,
"learning_rate": 1.0021528056391782e-06,
"loss": 0.117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.034841179847717285,
"step": 3305,
"valid_targets_mean": 5422.2,
"valid_targets_min": 2689
},
{
"epoch": 4.5534648921523635,
"grad_norm": 0.17263786107418352,
"learning_rate": 9.723508740470123e-07,
"loss": 0.1115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.037016794085502625,
"step": 3310,
"valid_targets_mean": 5195.3,
"valid_targets_min": 3110
},
{
"epoch": 4.560348783845801,
"grad_norm": 0.6697689536803294,
"learning_rate": 9.429877387635944e-07,
"loss": 0.1947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16726571321487427,
"step": 3315,
"valid_targets_mean": 3959.7,
"valid_targets_min": 1023
},
{
"epoch": 4.5672326755392385,
"grad_norm": 0.5264114313853077,
"learning_rate": 9.140640769317177e-07,
"loss": 0.4262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12650127708911896,
"step": 3320,
"valid_targets_mean": 3057.9,
"valid_targets_min": 1066
},
{
"epoch": 4.574116567232675,
"grad_norm": 0.392961284141338,
"learning_rate": 8.855805555594777e-07,
"loss": 0.4177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11679504811763763,
"step": 3325,
"valid_targets_mean": 4226.2,
"valid_targets_min": 902
},
{
"epoch": 4.581000458926113,
"grad_norm": 0.3220633125591813,
"learning_rate": 8.575378315048999e-07,
"loss": 0.4132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1164650171995163,
"step": 3330,
"valid_targets_mean": 3537.5,
"valid_targets_min": 1090
},
{
"epoch": 4.58788435061955,
"grad_norm": 0.2836347059693572,
"learning_rate": 8.299365514607883e-07,
"loss": 0.4073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11003822088241577,
"step": 3335,
"valid_targets_mean": 3058.2,
"valid_targets_min": 771
},
{
"epoch": 4.594768242312988,
"grad_norm": 0.3923630777914454,
"learning_rate": 8.027773519398207e-07,
"loss": 0.3835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12148011475801468,
"step": 3340,
"valid_targets_mean": 1120.0,
"valid_targets_min": 521
},
{
"epoch": 4.601652134006425,
"grad_norm": 0.23198120955974,
"learning_rate": 7.760608592598528e-07,
"loss": 0.3943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13927549123764038,
"step": 3345,
"valid_targets_mean": 4731.8,
"valid_targets_min": 1389
},
{
"epoch": 4.608536025699863,
"grad_norm": 0.2175553487141594,
"learning_rate": 7.497876895294931e-07,
"loss": 0.3707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1311253309249878,
"step": 3350,
"valid_targets_mean": 4816.6,
"valid_targets_min": 1341
},
{
"epoch": 4.6154199173933,
"grad_norm": 0.2523032181271898,
"learning_rate": 7.239584486338814e-07,
"loss": 0.392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12201976776123047,
"step": 3355,
"valid_targets_mean": 3374.7,
"valid_targets_min": 1239
},
{
"epoch": 4.622303809086737,
"grad_norm": 0.26995208568046913,
"learning_rate": 6.985737322207287e-07,
"loss": 0.3859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13418743014335632,
"step": 3360,
"valid_targets_mean": 3214.4,
"valid_targets_min": 621
},
{
"epoch": 4.629187700780174,
"grad_norm": 0.23355543900054457,
"learning_rate": 6.736341256865642e-07,
"loss": 0.3797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14379887282848358,
"step": 3365,
"valid_targets_mean": 5321.0,
"valid_targets_min": 1407
},
{
"epoch": 4.636071592473612,
"grad_norm": 0.2535456585399873,
"learning_rate": 6.491402041632544e-07,
"loss": 0.3888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11921147257089615,
"step": 3370,
"valid_targets_mean": 3536.7,
"valid_targets_min": 915
},
{
"epoch": 4.642955484167049,
"grad_norm": 0.2559436028551804,
"learning_rate": 6.250925325047252e-07,
"loss": 0.3744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09919558465480804,
"step": 3375,
"valid_targets_mean": 2772.1,
"valid_targets_min": 1106
},
{
"epoch": 4.649839375860487,
"grad_norm": 0.42012443586849063,
"learning_rate": 6.014916652739455e-07,
"loss": 0.3916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22293120622634888,
"step": 3380,
"valid_targets_mean": 3487.8,
"valid_targets_min": 523
},
{
"epoch": 4.656723267553923,
"grad_norm": 0.2264938566466451,
"learning_rate": 5.783381467301352e-07,
"loss": 0.3922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11772520840167999,
"step": 3385,
"valid_targets_mean": 4307.9,
"valid_targets_min": 1207
},
{
"epoch": 4.663607159247361,
"grad_norm": 0.23133653644845747,
"learning_rate": 5.556325108162064e-07,
"loss": 0.3825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14393877983093262,
"step": 3390,
"valid_targets_mean": 4449.8,
"valid_targets_min": 1036
},
{
"epoch": 4.670491050940798,
"grad_norm": 0.24444169804629398,
"learning_rate": 5.333752811464599e-07,
"loss": 0.3898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10904049873352051,
"step": 3395,
"valid_targets_mean": 3510.9,
"valid_targets_min": 1014
},
{
"epoch": 4.677374942634236,
"grad_norm": 0.2482052812902979,
"learning_rate": 5.115669709945148e-07,
"loss": 0.3865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13949604332447052,
"step": 3400,
"valid_targets_mean": 4310.5,
"valid_targets_min": 1193
},
{
"epoch": 4.684258834327673,
"grad_norm": 0.22143585652156172,
"learning_rate": 4.90208083281456e-07,
"loss": 0.3763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11191027611494064,
"step": 3405,
"valid_targets_mean": 4566.1,
"valid_targets_min": 1394
},
{
"epoch": 4.691142726021111,
"grad_norm": 0.28442610184717354,
"learning_rate": 4.692991105642519e-07,
"loss": 0.3825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.159225732088089,
"step": 3410,
"valid_targets_mean": 3325.2,
"valid_targets_min": 883
},
{
"epoch": 4.698026617714548,
"grad_norm": 0.24884829886272836,
"learning_rate": 4.488405350243752e-07,
"loss": 0.3955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12980762124061584,
"step": 3415,
"valid_targets_mean": 3990.3,
"valid_targets_min": 1374
},
{
"epoch": 4.704910509407985,
"grad_norm": 0.3883368549041478,
"learning_rate": 4.288328284567156e-07,
"loss": 0.359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11890369653701782,
"step": 3420,
"valid_targets_mean": 5897.4,
"valid_targets_min": 347
},
{
"epoch": 4.711794401101423,
"grad_norm": 0.37340217595337594,
"learning_rate": 4.092764522586601e-07,
"loss": 0.2684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07990404963493347,
"step": 3425,
"valid_targets_mean": 6455.6,
"valid_targets_min": 1359
},
{
"epoch": 4.71867829279486,
"grad_norm": 0.3565500859984899,
"learning_rate": 3.901718574194968e-07,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08166106045246124,
"step": 3430,
"valid_targets_mean": 6676.2,
"valid_targets_min": 1143
},
{
"epoch": 4.725562184488298,
"grad_norm": 0.313004986327095,
"learning_rate": 3.715194845099657e-07,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1039724126458168,
"step": 3435,
"valid_targets_mean": 6722.4,
"valid_targets_min": 505
},
{
"epoch": 4.732446076181735,
"grad_norm": 0.2809167735422918,
"learning_rate": 3.533197636721442e-07,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08939207345247269,
"step": 3440,
"valid_targets_mean": 7329.8,
"valid_targets_min": 1300
},
{
"epoch": 4.739329967875172,
"grad_norm": 0.2368355625717822,
"learning_rate": 3.3557311460949537e-07,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06595554202795029,
"step": 3445,
"valid_targets_mean": 6100.7,
"valid_targets_min": 1328
},
{
"epoch": 4.746213859568609,
"grad_norm": 0.24153571397417448,
"learning_rate": 3.182799465772135e-07,
"loss": 0.2339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05422850325703621,
"step": 3450,
"valid_targets_mean": 5562.0,
"valid_targets_min": 246
},
{
"epoch": 4.753097751262047,
"grad_norm": 0.2271226101292465,
"learning_rate": 3.014406583727603e-07,
"loss": 0.2453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05296333134174347,
"step": 3455,
"valid_targets_mean": 1929.8,
"valid_targets_min": 503
},
{
"epoch": 4.759981642955484,
"grad_norm": 0.21840229847924544,
"learning_rate": 2.8505563832669e-07,
"loss": 0.2358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0530148483812809,
"step": 3460,
"valid_targets_mean": 5253.4,
"valid_targets_min": 595
},
{
"epoch": 4.766865534648922,
"grad_norm": 0.21527749452897255,
"learning_rate": 2.691252642936859e-07,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06063324958086014,
"step": 3465,
"valid_targets_mean": 5247.3,
"valid_targets_min": 257
},
{
"epoch": 4.773749426342359,
"grad_norm": 0.19041316495333657,
"learning_rate": 2.5364990364384887e-07,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0600147545337677,
"step": 3470,
"valid_targets_mean": 5607.3,
"valid_targets_min": 452
},
{
"epoch": 4.780633318035797,
"grad_norm": 0.1842851141579877,
"learning_rate": 2.386299132542136e-07,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09336844086647034,
"step": 3475,
"valid_targets_mean": 7863.1,
"valid_targets_min": 1340
},
{
"epoch": 4.787517209729233,
"grad_norm": 0.20898692218205595,
"learning_rate": 2.240656395005414e-07,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13251468539237976,
"step": 3480,
"valid_targets_mean": 7620.9,
"valid_targets_min": 1084
},
{
"epoch": 4.794401101422671,
"grad_norm": 0.18482544111086033,
"learning_rate": 2.0995741824931138e-07,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06816096603870392,
"step": 3485,
"valid_targets_mean": 5906.8,
"valid_targets_min": 1288
},
{
"epoch": 4.801284993116108,
"grad_norm": 0.20241099039229132,
"learning_rate": 1.9630557484998647e-07,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0711783766746521,
"step": 3490,
"valid_targets_mean": 5153.4,
"valid_targets_min": 221
},
{
"epoch": 4.808168884809546,
"grad_norm": 0.18774049657388894,
"learning_rate": 1.8311042412750613e-07,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08386833965778351,
"step": 3495,
"valid_targets_mean": 7219.4,
"valid_targets_min": 219
},
{
"epoch": 4.815052776502983,
"grad_norm": 0.1814257677961071,
"learning_rate": 1.7037227037502546e-07,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06124308705329895,
"step": 3500,
"valid_targets_mean": 5985.7,
"valid_targets_min": 292
},
{
"epoch": 4.82193666819642,
"grad_norm": 0.17570467156043065,
"learning_rate": 1.5809140734690753e-07,
"loss": 0.2342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0560992956161499,
"step": 3505,
"valid_targets_mean": 5758.3,
"valid_targets_min": 310
},
{
"epoch": 4.8288205598898575,
"grad_norm": 0.16687189317724344,
"learning_rate": 1.4626811825192878e-07,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04680527746677399,
"step": 3510,
"valid_targets_mean": 5599.4,
"valid_targets_min": 982
},
{
"epoch": 4.835704451583295,
"grad_norm": 0.21506554619197757,
"learning_rate": 1.3490267574677528e-07,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.04162397235631943,
"step": 3515,
"valid_targets_mean": 2148.5,
"valid_targets_min": 457
},
{
"epoch": 4.8425883432767325,
"grad_norm": 0.3635867246852746,
"learning_rate": 1.2399534192972797e-07,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0672360360622406,
"step": 3520,
"valid_targets_mean": 4059.2,
"valid_targets_min": 1287
},
{
"epoch": 4.84947223497017,
"grad_norm": 0.3310539168438136,
"learning_rate": 1.1354636833463827e-07,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06172456964850426,
"step": 3525,
"valid_targets_mean": 3782.6,
"valid_targets_min": 428
},
{
"epoch": 4.8563561266636075,
"grad_norm": 0.33237941211528377,
"learning_rate": 1.0355599592511534e-07,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05413079261779785,
"step": 3530,
"valid_targets_mean": 3465.6,
"valid_targets_min": 478
},
{
"epoch": 4.863240018357045,
"grad_norm": 0.3094248279076241,
"learning_rate": 9.402445508897685e-08,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05988271161913872,
"step": 3535,
"valid_targets_mean": 3961.8,
"valid_targets_min": 534
},
{
"epoch": 4.870123910050482,
"grad_norm": 0.29242550385557875,
"learning_rate": 8.495196563293118e-08,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05963732674717903,
"step": 3540,
"valid_targets_mean": 3737.8,
"valid_targets_min": 572
},
{
"epoch": 4.877007801743919,
"grad_norm": 0.28190238416129615,
"learning_rate": 7.633873677751036e-08,
"loss": 0.1744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0610860139131546,
"step": 3545,
"valid_targets_mean": 3892.3,
"valid_targets_min": 419
},
{
"epoch": 4.883891693437357,
"grad_norm": 0.264213197144755,
"learning_rate": 6.818496715224721e-08,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.056852683424949646,
"step": 3550,
"valid_targets_mean": 3785.3,
"valid_targets_min": 578
},
{
"epoch": 4.890775585130794,
"grad_norm": 0.28203213789656356,
"learning_rate": 6.049084479109013e-08,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06058082729578018,
"step": 3555,
"valid_targets_mean": 3731.7,
"valid_targets_min": 430
},
{
"epoch": 4.897659476824232,
"grad_norm": 0.27415518234666697,
"learning_rate": 5.325654712807105e-08,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06047704070806503,
"step": 3560,
"valid_targets_mean": 3858.8,
"valid_targets_min": 704
},
{
"epoch": 4.904543368517668,
"grad_norm": 0.26692167270191103,
"learning_rate": 4.648224099321086e-08,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05759282037615776,
"step": 3565,
"valid_targets_mean": 3910.5,
"valid_targets_min": 433
},
{
"epoch": 4.911427260211106,
"grad_norm": 0.2613036512368632,
"learning_rate": 4.0168082608673666e-08,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05626670643687248,
"step": 3570,
"valid_targets_mean": 3696.9,
"valid_targets_min": 731
},
{
"epoch": 4.918311151904543,
"grad_norm": 0.2732742564108753,
"learning_rate": 3.431421758516518e-08,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0582839772105217,
"step": 3575,
"valid_targets_mean": 3753.9,
"valid_targets_min": 422
},
{
"epoch": 4.925195043597981,
"grad_norm": 0.25102179097888444,
"learning_rate": 2.8920780918570978e-08,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05331850051879883,
"step": 3580,
"valid_targets_mean": 3556.3,
"valid_targets_min": 462
},
{
"epoch": 4.932078935291418,
"grad_norm": 0.29257791826753676,
"learning_rate": 2.398789698684789e-08,
"loss": 0.1683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.059953607618808746,
"step": 3585,
"valid_targets_mean": 4006.8,
"valid_targets_min": 642
},
{
"epoch": 4.938962826984856,
"grad_norm": 0.524215825875638,
"learning_rate": 1.9515679547148504e-08,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10526755452156067,
"step": 3590,
"valid_targets_mean": 6701.7,
"valid_targets_min": 330
},
{
"epoch": 4.945846718678293,
"grad_norm": 0.5722645906369648,
"learning_rate": 1.550423173321214e-08,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09603773057460785,
"step": 3595,
"valid_targets_mean": 7118.6,
"valid_targets_min": 371
},
{
"epoch": 4.95273061037173,
"grad_norm": 0.5749651710529045,
"learning_rate": 1.1953646052969004e-08,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07218396663665771,
"step": 3600,
"valid_targets_mean": 6525.2,
"valid_targets_min": 437
},
{
"epoch": 4.959614502065167,
"grad_norm": 0.5773146128652207,
"learning_rate": 8.864004386419655e-09,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08016687631607056,
"step": 3605,
"valid_targets_mean": 6868.0,
"valid_targets_min": 860
},
{
"epoch": 4.966498393758605,
"grad_norm": 0.5465195501823726,
"learning_rate": 6.235377983738744e-09,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0723617821931839,
"step": 3610,
"valid_targets_mean": 5525.6,
"valid_targets_min": 398
},
{
"epoch": 4.973382285452042,
"grad_norm": 0.5787672219727664,
"learning_rate": 4.067827463638541e-09,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07634909451007843,
"step": 3615,
"valid_targets_mean": 6691.8,
"valid_targets_min": 327
},
{
"epoch": 4.98026617714548,
"grad_norm": 0.5163551559182284,
"learning_rate": 2.3614028119656186e-09,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0796852856874466,
"step": 3620,
"valid_targets_mean": 7097.7,
"valid_targets_min": 411
},
{
"epoch": 4.9871500688389165,
"grad_norm": 0.5453881277330466,
"learning_rate": 1.116143380552881e-09,
"loss": 0.2197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0733230710029602,
"step": 3625,
"valid_targets_mean": 6452.2,
"valid_targets_min": 250
},
{
"epoch": 4.994033960532354,
"grad_norm": 0.55973181421581,
"learning_rate": 3.320778863069585e-10,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07475747168064117,
"step": 3630,
"valid_targets_mean": 6448.4,
"valid_targets_min": 117
},
{
"epoch": 5.0,
"grad_norm": 0.9253128603774515,
"learning_rate": 9.224410548736018e-12,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3323420286178589,
"step": 3635,
"valid_targets_mean": 6423.8,
"valid_targets_min": 192
},
{
"epoch": 5.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3323420286178589,
"step": 3635,
"total_flos": 1.1450092629186839e+19,
"train_loss": 0.14989610923533592,
"train_runtime": 39124.5476,
"train_samples_per_second": 8.909,
"train_steps_per_second": 0.093,
"valid_targets_mean": 6423.8,
"valid_targets_min": 192
}
],
"logging_steps": 5,
"max_steps": 3635,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 300,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.1450092629186839e+19,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}