Files
a1-staqc/trainer_state.json
ModelHub XC 9e8f9161c6 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/a1-staqc
Source: Original Platform
2026-05-04 03:40:47 +08:00

9541 lines
264 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4319,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008103727714748784,
"grad_norm": 14.502046563847436,
"learning_rate": 3.7037037037037036e-07,
"loss": 0.8801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.9242562651634216,
"step": 5,
"valid_targets_mean": 4295.1,
"valid_targets_min": 1096
},
{
"epoch": 0.01620745542949757,
"grad_norm": 15.903096275441944,
"learning_rate": 8.333333333333333e-07,
"loss": 0.8843,
"loss_nan_ranks": 0,
"loss_rank_avg": 1.0109663009643555,
"step": 10,
"valid_targets_mean": 4119.3,
"valid_targets_min": 1110
},
{
"epoch": 0.024311183144246355,
"grad_norm": 12.890655417344467,
"learning_rate": 1.2962962962962962e-06,
"loss": 0.8416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8123115301132202,
"step": 15,
"valid_targets_mean": 3726.6,
"valid_targets_min": 696
},
{
"epoch": 0.03241491085899514,
"grad_norm": 10.128730652201147,
"learning_rate": 1.7592592592592594e-06,
"loss": 0.785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.718390703201294,
"step": 20,
"valid_targets_mean": 3520.1,
"valid_targets_min": 985
},
{
"epoch": 0.04051863857374392,
"grad_norm": 7.138044910532352,
"learning_rate": 2.222222222222222e-06,
"loss": 0.7489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7211443185806274,
"step": 25,
"valid_targets_mean": 4349.3,
"valid_targets_min": 1351
},
{
"epoch": 0.04862236628849271,
"grad_norm": 4.932655033986416,
"learning_rate": 2.6851851851851856e-06,
"loss": 0.7511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6623836755752563,
"step": 30,
"valid_targets_mean": 3442.4,
"valid_targets_min": 1153
},
{
"epoch": 0.05672609400324149,
"grad_norm": 3.188346911958201,
"learning_rate": 3.1481481481481483e-06,
"loss": 0.7389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7061078548431396,
"step": 35,
"valid_targets_mean": 3195.9,
"valid_targets_min": 1017
},
{
"epoch": 0.06482982171799027,
"grad_norm": 2.155975188008163,
"learning_rate": 3.6111111111111115e-06,
"loss": 0.6625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6780894994735718,
"step": 40,
"valid_targets_mean": 3058.6,
"valid_targets_min": 1235
},
{
"epoch": 0.07293354943273905,
"grad_norm": 1.5267785030853465,
"learning_rate": 4.074074074074074e-06,
"loss": 0.633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7597166299819946,
"step": 45,
"valid_targets_mean": 4936.4,
"valid_targets_min": 1436
},
{
"epoch": 0.08103727714748785,
"grad_norm": 1.4912835751224582,
"learning_rate": 4.537037037037038e-06,
"loss": 0.6283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6779534816741943,
"step": 50,
"valid_targets_mean": 2796.6,
"valid_targets_min": 823
},
{
"epoch": 0.08914100486223663,
"grad_norm": 1.2109844973016437,
"learning_rate": 5e-06,
"loss": 0.602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.619255542755127,
"step": 55,
"valid_targets_mean": 2768.4,
"valid_targets_min": 351
},
{
"epoch": 0.09724473257698542,
"grad_norm": 0.7300524443363055,
"learning_rate": 5.462962962962963e-06,
"loss": 0.6097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5387172698974609,
"step": 60,
"valid_targets_mean": 5398.2,
"valid_targets_min": 1450
},
{
"epoch": 0.1053484602917342,
"grad_norm": 0.6939352585635662,
"learning_rate": 5.925925925925926e-06,
"loss": 0.5651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4976433515548706,
"step": 65,
"valid_targets_mean": 5193.5,
"valid_targets_min": 260
},
{
"epoch": 0.11345218800648298,
"grad_norm": 0.8282020026122351,
"learning_rate": 6.3888888888888885e-06,
"loss": 0.5986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.562492847442627,
"step": 70,
"valid_targets_mean": 3213.2,
"valid_targets_min": 707
},
{
"epoch": 0.12155591572123177,
"grad_norm": 0.8388747146684071,
"learning_rate": 6.851851851851853e-06,
"loss": 0.5874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6159340143203735,
"step": 75,
"valid_targets_mean": 3616.1,
"valid_targets_min": 998
},
{
"epoch": 0.12965964343598055,
"grad_norm": 0.6349565573978161,
"learning_rate": 7.314814814814816e-06,
"loss": 0.5918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5378053784370422,
"step": 80,
"valid_targets_mean": 4808.6,
"valid_targets_min": 1076
},
{
"epoch": 0.13776337115072934,
"grad_norm": 0.6866539798766335,
"learning_rate": 7.77777777777778e-06,
"loss": 0.5544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5045327544212341,
"step": 85,
"valid_targets_mean": 4616.6,
"valid_targets_min": 1327
},
{
"epoch": 0.1458670988654781,
"grad_norm": 0.7135765247596682,
"learning_rate": 8.240740740740741e-06,
"loss": 0.5973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5626544952392578,
"step": 90,
"valid_targets_mean": 3737.9,
"valid_targets_min": 988
},
{
"epoch": 0.1539708265802269,
"grad_norm": 0.8944356346358915,
"learning_rate": 8.703703703703705e-06,
"loss": 0.5711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5422185659408569,
"step": 95,
"valid_targets_mean": 3383.4,
"valid_targets_min": 1063
},
{
"epoch": 0.1620745542949757,
"grad_norm": 0.6752326811138456,
"learning_rate": 9.166666666666666e-06,
"loss": 0.5453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5315940380096436,
"step": 100,
"valid_targets_mean": 3757.1,
"valid_targets_min": 916
},
{
"epoch": 0.17017828200972449,
"grad_norm": 0.7034188800227436,
"learning_rate": 9.62962962962963e-06,
"loss": 0.5076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5128780603408813,
"step": 105,
"valid_targets_mean": 3490.1,
"valid_targets_min": 1364
},
{
"epoch": 0.17828200972447325,
"grad_norm": 0.8563770301799251,
"learning_rate": 1.0092592592592594e-05,
"loss": 0.5609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6451968550682068,
"step": 110,
"valid_targets_mean": 3104.2,
"valid_targets_min": 714
},
{
"epoch": 0.18638573743922204,
"grad_norm": 0.6977828625213393,
"learning_rate": 1.0555555555555557e-05,
"loss": 0.5463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5652469396591187,
"step": 115,
"valid_targets_mean": 3494.4,
"valid_targets_min": 962
},
{
"epoch": 0.19448946515397084,
"grad_norm": 0.7024165934230638,
"learning_rate": 1.1018518518518519e-05,
"loss": 0.5138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48960810899734497,
"step": 120,
"valid_targets_mean": 3552.3,
"valid_targets_min": 942
},
{
"epoch": 0.2025931928687196,
"grad_norm": 0.6711618444311361,
"learning_rate": 1.1481481481481482e-05,
"loss": 0.5164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48685699701309204,
"step": 125,
"valid_targets_mean": 4097.9,
"valid_targets_min": 1264
},
{
"epoch": 0.2106969205834684,
"grad_norm": 0.8895538573513374,
"learning_rate": 1.1944444444444444e-05,
"loss": 0.5224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5535306930541992,
"step": 130,
"valid_targets_mean": 2476.7,
"valid_targets_min": 985
},
{
"epoch": 0.2188006482982172,
"grad_norm": 0.7147279273965873,
"learning_rate": 1.2407407407407408e-05,
"loss": 0.5609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5410614609718323,
"step": 135,
"valid_targets_mean": 3292.9,
"valid_targets_min": 1219
},
{
"epoch": 0.22690437601296595,
"grad_norm": 0.5760847796962758,
"learning_rate": 1.2870370370370371e-05,
"loss": 0.5127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4297313690185547,
"step": 140,
"valid_targets_mean": 4090.2,
"valid_targets_min": 1376
},
{
"epoch": 0.23500810372771475,
"grad_norm": 0.6252622714518827,
"learning_rate": 1.3333333333333333e-05,
"loss": 0.5182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4308566451072693,
"step": 145,
"valid_targets_mean": 3886.9,
"valid_targets_min": 1244
},
{
"epoch": 0.24311183144246354,
"grad_norm": 0.664417459291334,
"learning_rate": 1.3796296296296297e-05,
"loss": 0.5026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49792343378067017,
"step": 150,
"valid_targets_mean": 3989.4,
"valid_targets_min": 987
},
{
"epoch": 0.25121555915721233,
"grad_norm": 0.4487043325414751,
"learning_rate": 1.4259259259259259e-05,
"loss": 0.4752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36317574977874756,
"step": 155,
"valid_targets_mean": 6837.2,
"valid_targets_min": 1064
},
{
"epoch": 0.2593192868719611,
"grad_norm": 0.6029473626318651,
"learning_rate": 1.4722222222222224e-05,
"loss": 0.5177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44724512100219727,
"step": 160,
"valid_targets_mean": 4923.8,
"valid_targets_min": 1165
},
{
"epoch": 0.26742301458670986,
"grad_norm": 0.5768270103259813,
"learning_rate": 1.5185185185185187e-05,
"loss": 0.5058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4138815999031067,
"step": 165,
"valid_targets_mean": 4088.1,
"valid_targets_min": 887
},
{
"epoch": 0.2755267423014587,
"grad_norm": 0.5493315381239489,
"learning_rate": 1.564814814814815e-05,
"loss": 0.4689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44827204942703247,
"step": 170,
"valid_targets_mean": 5288.2,
"valid_targets_min": 1507
},
{
"epoch": 0.28363047001620745,
"grad_norm": 0.7994248985246581,
"learning_rate": 1.6111111111111115e-05,
"loss": 0.4863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5198005437850952,
"step": 175,
"valid_targets_mean": 2657.2,
"valid_targets_min": 1139
},
{
"epoch": 0.2917341977309562,
"grad_norm": 0.9722413882474711,
"learning_rate": 1.6574074074074075e-05,
"loss": 0.513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5183806419372559,
"step": 180,
"valid_targets_mean": 3431.2,
"valid_targets_min": 845
},
{
"epoch": 0.29983792544570503,
"grad_norm": 0.6589835217769006,
"learning_rate": 1.7037037037037038e-05,
"loss": 0.5393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5170410871505737,
"step": 185,
"valid_targets_mean": 5086.8,
"valid_targets_min": 1333
},
{
"epoch": 0.3079416531604538,
"grad_norm": 0.6967830216075351,
"learning_rate": 1.7500000000000002e-05,
"loss": 0.4479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47171273827552795,
"step": 190,
"valid_targets_mean": 4035.7,
"valid_targets_min": 1039
},
{
"epoch": 0.3160453808752026,
"grad_norm": 0.821386141264342,
"learning_rate": 1.7962962962962965e-05,
"loss": 0.5305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6754404902458191,
"step": 195,
"valid_targets_mean": 3246.0,
"valid_targets_min": 1267
},
{
"epoch": 0.3241491085899514,
"grad_norm": 0.7996690171267771,
"learning_rate": 1.8425925925925926e-05,
"loss": 0.4836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4826638996601105,
"step": 200,
"valid_targets_mean": 2741.5,
"valid_targets_min": 1119
},
{
"epoch": 0.33225283630470015,
"grad_norm": 0.7619254088595571,
"learning_rate": 1.888888888888889e-05,
"loss": 0.4903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47676026821136475,
"step": 205,
"valid_targets_mean": 3212.6,
"valid_targets_min": 849
},
{
"epoch": 0.34035656401944897,
"grad_norm": 0.6571212058463909,
"learning_rate": 1.9351851851851853e-05,
"loss": 0.5098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5193724036216736,
"step": 210,
"valid_targets_mean": 4616.6,
"valid_targets_min": 1602
},
{
"epoch": 0.34846029173419774,
"grad_norm": 0.6304645656002126,
"learning_rate": 1.9814814814814816e-05,
"loss": 0.503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.446179062128067,
"step": 215,
"valid_targets_mean": 4198.4,
"valid_targets_min": 688
},
{
"epoch": 0.3565640194489465,
"grad_norm": 0.797707714974618,
"learning_rate": 2.027777777777778e-05,
"loss": 0.4763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5235961675643921,
"step": 220,
"valid_targets_mean": 3196.6,
"valid_targets_min": 1181
},
{
"epoch": 0.3646677471636953,
"grad_norm": 0.8339761763253815,
"learning_rate": 2.074074074074074e-05,
"loss": 0.5363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5340523719787598,
"step": 225,
"valid_targets_mean": 3011.3,
"valid_targets_min": 1068
},
{
"epoch": 0.3727714748784441,
"grad_norm": 0.8061816435780602,
"learning_rate": 2.1203703703703703e-05,
"loss": 0.4665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3998042941093445,
"step": 230,
"valid_targets_mean": 3933.1,
"valid_targets_min": 1459
},
{
"epoch": 0.38087520259319285,
"grad_norm": 0.8327959127590774,
"learning_rate": 2.1666666666666667e-05,
"loss": 0.462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5590848922729492,
"step": 235,
"valid_targets_mean": 3193.1,
"valid_targets_min": 1423
},
{
"epoch": 0.3889789303079417,
"grad_norm": 0.7369049954720542,
"learning_rate": 2.212962962962963e-05,
"loss": 0.4519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47498127818107605,
"step": 240,
"valid_targets_mean": 3404.8,
"valid_targets_min": 1482
},
{
"epoch": 0.39708265802269044,
"grad_norm": 0.7763169284637017,
"learning_rate": 2.2592592592592594e-05,
"loss": 0.4707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39968666434288025,
"step": 245,
"valid_targets_mean": 3643.1,
"valid_targets_min": 890
},
{
"epoch": 0.4051863857374392,
"grad_norm": 0.5745074030464737,
"learning_rate": 2.3055555555555554e-05,
"loss": 0.4828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4340120851993561,
"step": 250,
"valid_targets_mean": 4889.4,
"valid_targets_min": 1652
},
{
"epoch": 0.413290113452188,
"grad_norm": 0.6509176855544626,
"learning_rate": 2.3518518518518518e-05,
"loss": 0.48,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4259786605834961,
"step": 255,
"valid_targets_mean": 4724.8,
"valid_targets_min": 1665
},
{
"epoch": 0.4213938411669368,
"grad_norm": 0.6382937773930243,
"learning_rate": 2.3981481481481485e-05,
"loss": 0.4641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4811030626296997,
"step": 260,
"valid_targets_mean": 3824.5,
"valid_targets_min": 958
},
{
"epoch": 0.42949756888168555,
"grad_norm": 0.7814960892271423,
"learning_rate": 2.444444444444445e-05,
"loss": 0.4826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4951825737953186,
"step": 265,
"valid_targets_mean": 2962.9,
"valid_targets_min": 1195
},
{
"epoch": 0.4376012965964344,
"grad_norm": 0.7860611727969448,
"learning_rate": 2.4907407407407412e-05,
"loss": 0.5235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.465817928314209,
"step": 270,
"valid_targets_mean": 4154.8,
"valid_targets_min": 1001
},
{
"epoch": 0.44570502431118314,
"grad_norm": 0.7225875405455014,
"learning_rate": 2.5370370370370375e-05,
"loss": 0.4314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4747081995010376,
"step": 275,
"valid_targets_mean": 3147.5,
"valid_targets_min": 1231
},
{
"epoch": 0.4538087520259319,
"grad_norm": 0.7579343166171137,
"learning_rate": 2.5833333333333336e-05,
"loss": 0.4712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4651714265346527,
"step": 280,
"valid_targets_mean": 2885.6,
"valid_targets_min": 916
},
{
"epoch": 0.4619124797406807,
"grad_norm": 0.6458345103499519,
"learning_rate": 2.62962962962963e-05,
"loss": 0.479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44281134009361267,
"step": 285,
"valid_targets_mean": 4319.7,
"valid_targets_min": 1245
},
{
"epoch": 0.4700162074554295,
"grad_norm": 0.7007184493552016,
"learning_rate": 2.6759259259259263e-05,
"loss": 0.4632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43551719188690186,
"step": 290,
"valid_targets_mean": 3202.4,
"valid_targets_min": 342
},
{
"epoch": 0.47811993517017826,
"grad_norm": 0.7307318580304619,
"learning_rate": 2.7222222222222226e-05,
"loss": 0.4552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4373762607574463,
"step": 295,
"valid_targets_mean": 3294.9,
"valid_targets_min": 1019
},
{
"epoch": 0.4862236628849271,
"grad_norm": 0.9011037479565293,
"learning_rate": 2.768518518518519e-05,
"loss": 0.4564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4616827368736267,
"step": 300,
"valid_targets_mean": 2662.6,
"valid_targets_min": 1290
},
{
"epoch": 0.49432739059967584,
"grad_norm": 0.7121661911160081,
"learning_rate": 2.814814814814815e-05,
"loss": 0.4694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42763668298721313,
"step": 305,
"valid_targets_mean": 3236.9,
"valid_targets_min": 815
},
{
"epoch": 0.5024311183144247,
"grad_norm": 0.8096707896642864,
"learning_rate": 2.8611111111111113e-05,
"loss": 0.4287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4525720775127411,
"step": 310,
"valid_targets_mean": 2636.4,
"valid_targets_min": 999
},
{
"epoch": 0.5105348460291734,
"grad_norm": 0.7261203808002379,
"learning_rate": 2.9074074074074077e-05,
"loss": 0.4664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48865166306495667,
"step": 315,
"valid_targets_mean": 3461.4,
"valid_targets_min": 897
},
{
"epoch": 0.5186385737439222,
"grad_norm": 1.2575281945746308,
"learning_rate": 2.953703703703704e-05,
"loss": 0.4828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5157779455184937,
"step": 320,
"valid_targets_mean": 2379.4,
"valid_targets_min": 1189
},
{
"epoch": 0.526742301458671,
"grad_norm": 0.7251897026165784,
"learning_rate": 3.0000000000000004e-05,
"loss": 0.4352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46817487478256226,
"step": 325,
"valid_targets_mean": 3586.9,
"valid_targets_min": 1204
},
{
"epoch": 0.5348460291734197,
"grad_norm": 0.7598243027449975,
"learning_rate": 3.0462962962962964e-05,
"loss": 0.4647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40748733282089233,
"step": 330,
"valid_targets_mean": 3351.0,
"valid_targets_min": 1153
},
{
"epoch": 0.5429497568881686,
"grad_norm": 0.5867804558692091,
"learning_rate": 3.092592592592593e-05,
"loss": 0.4548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3633122146129608,
"step": 335,
"valid_targets_mean": 4532.9,
"valid_targets_min": 1330
},
{
"epoch": 0.5510534846029174,
"grad_norm": 0.8308762981819495,
"learning_rate": 3.138888888888889e-05,
"loss": 0.4196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44768840074539185,
"step": 340,
"valid_targets_mean": 2915.2,
"valid_targets_min": 1129
},
{
"epoch": 0.5591572123176661,
"grad_norm": 0.7168296495416179,
"learning_rate": 3.185185185185185e-05,
"loss": 0.4715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47569552063941956,
"step": 345,
"valid_targets_mean": 3553.9,
"valid_targets_min": 934
},
{
"epoch": 0.5672609400324149,
"grad_norm": 0.7779706686981114,
"learning_rate": 3.231481481481482e-05,
"loss": 0.4571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45146211981773376,
"step": 350,
"valid_targets_mean": 2965.0,
"valid_targets_min": 1124
},
{
"epoch": 0.5753646677471637,
"grad_norm": 0.6521122222225881,
"learning_rate": 3.277777777777778e-05,
"loss": 0.4165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.383737713098526,
"step": 355,
"valid_targets_mean": 3290.4,
"valid_targets_min": 445
},
{
"epoch": 0.5834683954619124,
"grad_norm": 0.6903093659168319,
"learning_rate": 3.3240740740740746e-05,
"loss": 0.4344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44812503457069397,
"step": 360,
"valid_targets_mean": 3197.4,
"valid_targets_min": 993
},
{
"epoch": 0.5915721231766613,
"grad_norm": 0.5893356617898746,
"learning_rate": 3.3703703703703706e-05,
"loss": 0.4698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43500688672065735,
"step": 365,
"valid_targets_mean": 4616.5,
"valid_targets_min": 1276
},
{
"epoch": 0.5996758508914101,
"grad_norm": 0.5704634541622681,
"learning_rate": 3.4166666666666666e-05,
"loss": 0.4545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4581429362297058,
"step": 370,
"valid_targets_mean": 5007.1,
"valid_targets_min": 1027
},
{
"epoch": 0.6077795786061588,
"grad_norm": 0.6250080462027718,
"learning_rate": 3.462962962962963e-05,
"loss": 0.4421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4598006308078766,
"step": 375,
"valid_targets_mean": 4201.1,
"valid_targets_min": 1594
},
{
"epoch": 0.6158833063209076,
"grad_norm": 0.604145580512504,
"learning_rate": 3.509259259259259e-05,
"loss": 0.4483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38162094354629517,
"step": 380,
"valid_targets_mean": 4180.4,
"valid_targets_min": 1192
},
{
"epoch": 0.6239870340356564,
"grad_norm": 0.8135079481344287,
"learning_rate": 3.555555555555555e-05,
"loss": 0.5118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5114529132843018,
"step": 385,
"valid_targets_mean": 2778.4,
"valid_targets_min": 1183
},
{
"epoch": 0.6320907617504052,
"grad_norm": 0.7156111178744403,
"learning_rate": 3.601851851851852e-05,
"loss": 0.4418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42450952529907227,
"step": 390,
"valid_targets_mean": 2836.8,
"valid_targets_min": 1203
},
{
"epoch": 0.640194489465154,
"grad_norm": 0.6233850159032864,
"learning_rate": 3.648148148148149e-05,
"loss": 0.4337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4477499723434448,
"step": 395,
"valid_targets_mean": 4234.6,
"valid_targets_min": 1001
},
{
"epoch": 0.6482982171799028,
"grad_norm": 0.6873205556027221,
"learning_rate": 3.694444444444445e-05,
"loss": 0.4436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4863933324813843,
"step": 400,
"valid_targets_mean": 3356.6,
"valid_targets_min": 1213
},
{
"epoch": 0.6564019448946515,
"grad_norm": 0.5459953172678582,
"learning_rate": 3.7407407407407414e-05,
"loss": 0.4143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35290199518203735,
"step": 405,
"valid_targets_mean": 4598.9,
"valid_targets_min": 983
},
{
"epoch": 0.6645056726094003,
"grad_norm": 0.6910108927145312,
"learning_rate": 3.7870370370370374e-05,
"loss": 0.4879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44417983293533325,
"step": 410,
"valid_targets_mean": 3119.1,
"valid_targets_min": 1184
},
{
"epoch": 0.6726094003241491,
"grad_norm": 0.5251638853973931,
"learning_rate": 3.833333333333334e-05,
"loss": 0.4003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3857458829879761,
"step": 415,
"valid_targets_mean": 5829.8,
"valid_targets_min": 1662
},
{
"epoch": 0.6807131280388979,
"grad_norm": 0.5492363264332838,
"learning_rate": 3.87962962962963e-05,
"loss": 0.4234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3834828734397888,
"step": 420,
"valid_targets_mean": 4159.3,
"valid_targets_min": 403
},
{
"epoch": 0.6888168557536467,
"grad_norm": 0.6657955711902417,
"learning_rate": 3.925925925925926e-05,
"loss": 0.4585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4726736545562744,
"step": 425,
"valid_targets_mean": 4370.1,
"valid_targets_min": 992
},
{
"epoch": 0.6969205834683955,
"grad_norm": 0.8215679499444706,
"learning_rate": 3.972222222222223e-05,
"loss": 0.4492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5097543597221375,
"step": 430,
"valid_targets_mean": 2555.1,
"valid_targets_min": 1160
},
{
"epoch": 0.7050243111831442,
"grad_norm": 0.6324092514283729,
"learning_rate": 3.99999738705324e-05,
"loss": 0.4479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3866470158100128,
"step": 435,
"valid_targets_mean": 3941.9,
"valid_targets_min": 1237
},
{
"epoch": 0.713128038897893,
"grad_norm": 0.7808262105006745,
"learning_rate": 3.999967991480598e-05,
"loss": 0.4242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4729665517807007,
"step": 440,
"valid_targets_mean": 2932.7,
"valid_targets_min": 1097
},
{
"epoch": 0.7212317666126418,
"grad_norm": 0.6797144276661182,
"learning_rate": 3.99990593463352e-05,
"loss": 0.4634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47761768102645874,
"step": 445,
"valid_targets_mean": 3771.3,
"valid_targets_min": 1436
},
{
"epoch": 0.7293354943273906,
"grad_norm": 0.7894421925623699,
"learning_rate": 3.9998112175254504e-05,
"loss": 0.4495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48762065172195435,
"step": 450,
"valid_targets_mean": 2831.8,
"valid_targets_min": 1503
},
{
"epoch": 0.7374392220421394,
"grad_norm": 0.7071798523471358,
"learning_rate": 3.9996838417032044e-05,
"loss": 0.4311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5425790548324585,
"step": 455,
"valid_targets_mean": 3630.4,
"valid_targets_min": 1009
},
{
"epoch": 0.7455429497568882,
"grad_norm": 0.85816434814954,
"learning_rate": 3.999523809246943e-05,
"loss": 0.4367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45270124077796936,
"step": 460,
"valid_targets_mean": 2890.2,
"valid_targets_min": 1181
},
{
"epoch": 0.7536466774716369,
"grad_norm": 0.7183863410015342,
"learning_rate": 3.9993311227701415e-05,
"loss": 0.4237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.481193482875824,
"step": 465,
"valid_targets_mean": 2988.1,
"valid_targets_min": 1100
},
{
"epoch": 0.7617504051863857,
"grad_norm": 0.5698856112206491,
"learning_rate": 3.9991057854195424e-05,
"loss": 0.4704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.550667405128479,
"step": 470,
"valid_targets_mean": 5871.3,
"valid_targets_min": 749
},
{
"epoch": 0.7698541329011345,
"grad_norm": 0.6288923533755414,
"learning_rate": 3.998847800875107e-05,
"loss": 0.4034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4150170087814331,
"step": 475,
"valid_targets_mean": 3744.1,
"valid_targets_min": 1145
},
{
"epoch": 0.7779578606158833,
"grad_norm": 0.7841484146071308,
"learning_rate": 3.9985571733499544e-05,
"loss": 0.4228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4479774832725525,
"step": 480,
"valid_targets_mean": 2472.2,
"valid_targets_min": 1320
},
{
"epoch": 0.7860615883306321,
"grad_norm": 0.700045967636308,
"learning_rate": 3.998233907590294e-05,
"loss": 0.4584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44580456614494324,
"step": 485,
"valid_targets_mean": 3343.3,
"valid_targets_min": 1102
},
{
"epoch": 0.7941653160453809,
"grad_norm": 0.629997635377666,
"learning_rate": 3.9978780088753464e-05,
"loss": 0.4529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4441825747489929,
"step": 490,
"valid_targets_mean": 3981.2,
"valid_targets_min": 1551
},
{
"epoch": 0.8022690437601296,
"grad_norm": 0.6817904477118991,
"learning_rate": 3.997489483017256e-05,
"loss": 0.4131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4390064477920532,
"step": 495,
"valid_targets_mean": 3689.6,
"valid_targets_min": 1495
},
{
"epoch": 0.8103727714748784,
"grad_norm": 0.6185939925084256,
"learning_rate": 3.997068336361e-05,
"loss": 0.4502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3633172810077667,
"step": 500,
"valid_targets_mean": 4270.8,
"valid_targets_min": 858
},
{
"epoch": 0.8184764991896273,
"grad_norm": 0.879292203617941,
"learning_rate": 3.996614575784282e-05,
"loss": 0.4163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4245051145553589,
"step": 505,
"valid_targets_mean": 4214.6,
"valid_targets_min": 1415
},
{
"epoch": 0.826580226904376,
"grad_norm": 0.7885150453655395,
"learning_rate": 3.99612820869742e-05,
"loss": 0.4717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4266160726547241,
"step": 510,
"valid_targets_mean": 2683.9,
"valid_targets_min": 1147
},
{
"epoch": 0.8346839546191248,
"grad_norm": 0.6732147232946274,
"learning_rate": 3.9956092430432254e-05,
"loss": 0.437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4329238533973694,
"step": 515,
"valid_targets_mean": 3728.2,
"valid_targets_min": 1153
},
{
"epoch": 0.8427876823338736,
"grad_norm": 0.8663697967068255,
"learning_rate": 3.9950576872968735e-05,
"loss": 0.4436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44332367181777954,
"step": 520,
"valid_targets_mean": 4120.1,
"valid_targets_min": 1120
},
{
"epoch": 0.8508914100486223,
"grad_norm": 0.6675209752863196,
"learning_rate": 3.994473550465765e-05,
"loss": 0.4373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42500463128089905,
"step": 525,
"valid_targets_mean": 3894.8,
"valid_targets_min": 1595
},
{
"epoch": 0.8589951377633711,
"grad_norm": 1.156331824829645,
"learning_rate": 3.993856842089379e-05,
"loss": 0.4993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4912262558937073,
"step": 530,
"valid_targets_mean": 2224.8,
"valid_targets_min": 813
},
{
"epoch": 0.86709886547812,
"grad_norm": 0.594392464554485,
"learning_rate": 3.99320757223912e-05,
"loss": 0.4307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4009823203086853,
"step": 535,
"valid_targets_mean": 4163.1,
"valid_targets_min": 1266
},
{
"epoch": 0.8752025931928687,
"grad_norm": 0.5042294566986941,
"learning_rate": 3.992525751518144e-05,
"loss": 0.4034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3967186212539673,
"step": 540,
"valid_targets_mean": 6045.8,
"valid_targets_min": 1249
},
{
"epoch": 0.8833063209076175,
"grad_norm": 0.7508835619309017,
"learning_rate": 3.991811391061199e-05,
"loss": 0.394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41827213764190674,
"step": 545,
"valid_targets_mean": 3118.6,
"valid_targets_min": 349
},
{
"epoch": 0.8914100486223663,
"grad_norm": 2.109010732539915,
"learning_rate": 3.9910645025344324e-05,
"loss": 0.4496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4581921696662903,
"step": 550,
"valid_targets_mean": 4448.7,
"valid_targets_min": 1252
},
{
"epoch": 0.899513776337115,
"grad_norm": 0.505861640073071,
"learning_rate": 3.990285098135204e-05,
"loss": 0.4245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4023759365081787,
"step": 555,
"valid_targets_mean": 5656.4,
"valid_targets_min": 1084
},
{
"epoch": 0.9076175040518638,
"grad_norm": 0.7084642299995411,
"learning_rate": 3.98947319059189e-05,
"loss": 0.4338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4089127779006958,
"step": 560,
"valid_targets_mean": 3820.6,
"valid_targets_min": 800
},
{
"epoch": 0.9157212317666127,
"grad_norm": 0.7838903874181324,
"learning_rate": 3.988628793163669e-05,
"loss": 0.4763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47754400968551636,
"step": 565,
"valid_targets_mean": 3355.3,
"valid_targets_min": 1983
},
{
"epoch": 0.9238249594813615,
"grad_norm": 0.7697692626341919,
"learning_rate": 3.987751919640309e-05,
"loss": 0.4241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41041046380996704,
"step": 570,
"valid_targets_mean": 3666.2,
"valid_targets_min": 1160
},
{
"epoch": 0.9319286871961102,
"grad_norm": 0.5892131127706576,
"learning_rate": 3.9868425843419445e-05,
"loss": 0.4032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4179239571094513,
"step": 575,
"valid_targets_mean": 4579.3,
"valid_targets_min": 1043
},
{
"epoch": 0.940032414910859,
"grad_norm": 0.5400962924292961,
"learning_rate": 3.985900802118836e-05,
"loss": 0.4318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4245756268501282,
"step": 580,
"valid_targets_mean": 5453.4,
"valid_targets_min": 1178
},
{
"epoch": 0.9481361426256077,
"grad_norm": 0.6919745305835788,
"learning_rate": 3.984926588351135e-05,
"loss": 0.4518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45021432638168335,
"step": 585,
"valid_targets_mean": 3102.4,
"valid_targets_min": 296
},
{
"epoch": 0.9562398703403565,
"grad_norm": 0.6591393873889547,
"learning_rate": 3.983919958948627e-05,
"loss": 0.4142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42304936051368713,
"step": 590,
"valid_targets_mean": 3353.1,
"valid_targets_min": 1418
},
{
"epoch": 0.9643435980551054,
"grad_norm": 0.5632951141018055,
"learning_rate": 3.982880930350474e-05,
"loss": 0.4174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4031622111797333,
"step": 595,
"valid_targets_mean": 4799.3,
"valid_targets_min": 1247
},
{
"epoch": 0.9724473257698542,
"grad_norm": 0.5232136419625988,
"learning_rate": 3.981809519524948e-05,
"loss": 0.4119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3731626272201538,
"step": 600,
"valid_targets_mean": 4803.6,
"valid_targets_min": 906
},
{
"epoch": 0.9805510534846029,
"grad_norm": 0.6326091273919606,
"learning_rate": 3.98070574396915e-05,
"loss": 0.431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42506226897239685,
"step": 605,
"valid_targets_mean": 4227.1,
"valid_targets_min": 692
},
{
"epoch": 0.9886547811993517,
"grad_norm": 0.6045895230930198,
"learning_rate": 3.979569621708727e-05,
"loss": 0.4239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5133014917373657,
"step": 610,
"valid_targets_mean": 4420.0,
"valid_targets_min": 1620
},
{
"epoch": 0.9967585089141004,
"grad_norm": 0.7123425243387163,
"learning_rate": 3.978401171297576e-05,
"loss": 0.4082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4153461456298828,
"step": 615,
"valid_targets_mean": 2826.6,
"valid_targets_min": 1183
},
{
"epoch": 1.0048622366288493,
"grad_norm": 0.539167883549107,
"learning_rate": 3.9772004118175424e-05,
"loss": 0.4051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4070894122123718,
"step": 620,
"valid_targets_mean": 4499.4,
"valid_targets_min": 1437
},
{
"epoch": 1.012965964343598,
"grad_norm": 0.6626488535519265,
"learning_rate": 3.975967362878106e-05,
"loss": 0.4298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5363422632217407,
"step": 625,
"valid_targets_mean": 4372.2,
"valid_targets_min": 1387
},
{
"epoch": 1.0210696920583469,
"grad_norm": 0.7049923386137342,
"learning_rate": 3.9747020446160665e-05,
"loss": 0.3794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.411579430103302,
"step": 630,
"valid_targets_mean": 3333.8,
"valid_targets_min": 260
},
{
"epoch": 1.0291734197730957,
"grad_norm": 0.6429529234872674,
"learning_rate": 3.973404477695207e-05,
"loss": 0.3909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4016868472099304,
"step": 635,
"valid_targets_mean": 3914.5,
"valid_targets_min": 964
},
{
"epoch": 1.0372771474878444,
"grad_norm": 0.8430734597321315,
"learning_rate": 3.972074683305961e-05,
"loss": 0.3793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4546150863170624,
"step": 640,
"valid_targets_mean": 3274.8,
"valid_targets_min": 651
},
{
"epoch": 1.0453808752025933,
"grad_norm": 0.691765509979604,
"learning_rate": 3.970712683165066e-05,
"loss": 0.3941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3804226815700531,
"step": 645,
"valid_targets_mean": 3015.3,
"valid_targets_min": 1176
},
{
"epoch": 1.053484602917342,
"grad_norm": 0.7121115958430826,
"learning_rate": 3.969318499515208e-05,
"loss": 0.387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4142545163631439,
"step": 650,
"valid_targets_mean": 3504.2,
"valid_targets_min": 684
},
{
"epoch": 1.0615883306320908,
"grad_norm": 0.5999484561204884,
"learning_rate": 3.967892155124659e-05,
"loss": 0.4022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3854263424873352,
"step": 655,
"valid_targets_mean": 4220.0,
"valid_targets_min": 1095
},
{
"epoch": 1.0696920583468394,
"grad_norm": 0.5713234178165169,
"learning_rate": 3.9664336732869044e-05,
"loss": 0.3996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3343764841556549,
"step": 660,
"valid_targets_mean": 3993.2,
"valid_targets_min": 1225
},
{
"epoch": 1.0777957860615883,
"grad_norm": 0.7329951448315434,
"learning_rate": 3.964943077820263e-05,
"loss": 0.4483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44141700863838196,
"step": 665,
"valid_targets_mean": 3044.4,
"valid_targets_min": 1388
},
{
"epoch": 1.0858995137763372,
"grad_norm": 0.7502131949551032,
"learning_rate": 3.963420393067499e-05,
"loss": 0.436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4431774616241455,
"step": 670,
"valid_targets_mean": 2909.8,
"valid_targets_min": 1386
},
{
"epoch": 1.0940032414910859,
"grad_norm": 0.5182332836674972,
"learning_rate": 3.961865643895422e-05,
"loss": 0.4116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2863534986972809,
"step": 675,
"valid_targets_mean": 4810.2,
"valid_targets_min": 999
},
{
"epoch": 1.1021069692058347,
"grad_norm": 0.7191407703553409,
"learning_rate": 3.960278855694484e-05,
"loss": 0.3964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42751169204711914,
"step": 680,
"valid_targets_mean": 5616.1,
"valid_targets_min": 1414
},
{
"epoch": 1.1102106969205834,
"grad_norm": 0.5066897158392785,
"learning_rate": 3.958660054378361e-05,
"loss": 0.4463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33914482593536377,
"step": 685,
"valid_targets_mean": 5099.1,
"valid_targets_min": 1419
},
{
"epoch": 1.1183144246353323,
"grad_norm": 0.5236343651746419,
"learning_rate": 3.9570092663835334e-05,
"loss": 0.415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3773620128631592,
"step": 690,
"valid_targets_mean": 4685.4,
"valid_targets_min": 710
},
{
"epoch": 1.1264181523500811,
"grad_norm": 0.7039460112163713,
"learning_rate": 3.9553265186688525e-05,
"loss": 0.3993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44046705961227417,
"step": 695,
"valid_targets_mean": 3954.5,
"valid_targets_min": 1168
},
{
"epoch": 1.1345218800648298,
"grad_norm": 0.6654606056629773,
"learning_rate": 3.953611838715101e-05,
"loss": 0.4225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4078805446624756,
"step": 700,
"valid_targets_mean": 3752.2,
"valid_targets_min": 1312
},
{
"epoch": 1.1426256077795787,
"grad_norm": 0.6514465887784622,
"learning_rate": 3.951865254524542e-05,
"loss": 0.4026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3984151780605316,
"step": 705,
"valid_targets_mean": 3862.8,
"valid_targets_min": 1563
},
{
"epoch": 1.1507293354943273,
"grad_norm": 0.6471325396020866,
"learning_rate": 3.950086794620467e-05,
"loss": 0.4328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43052127957344055,
"step": 710,
"valid_targets_mean": 3554.1,
"valid_targets_min": 898
},
{
"epoch": 1.1588330632090762,
"grad_norm": 0.5873275500250088,
"learning_rate": 3.948276488046723e-05,
"loss": 0.396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3730786144733429,
"step": 715,
"valid_targets_mean": 3719.2,
"valid_targets_min": 1152
},
{
"epoch": 1.1669367909238249,
"grad_norm": 0.467522004257344,
"learning_rate": 3.946434364367243e-05,
"loss": 0.3867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3182247281074524,
"step": 720,
"valid_targets_mean": 5996.4,
"valid_targets_min": 349
},
{
"epoch": 1.1750405186385737,
"grad_norm": 0.6791400275737529,
"learning_rate": 3.9445604536655625e-05,
"loss": 0.4678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5305315256118774,
"step": 725,
"valid_targets_mean": 5634.3,
"valid_targets_min": 1711
},
{
"epoch": 1.1831442463533226,
"grad_norm": 0.5174903212149605,
"learning_rate": 3.9426547865443264e-05,
"loss": 0.4005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33829182386398315,
"step": 730,
"valid_targets_mean": 4885.6,
"valid_targets_min": 995
},
{
"epoch": 1.1912479740680713,
"grad_norm": 0.7597194711385206,
"learning_rate": 3.940717394124792e-05,
"loss": 0.4487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44391706585884094,
"step": 735,
"valid_targets_mean": 2776.8,
"valid_targets_min": 1116
},
{
"epoch": 1.1993517017828201,
"grad_norm": 0.7881689255335056,
"learning_rate": 3.938748308046318e-05,
"loss": 0.4106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44584935903549194,
"step": 740,
"valid_targets_mean": 3193.6,
"valid_targets_min": 1003
},
{
"epoch": 1.2074554294975688,
"grad_norm": 0.8381756076442425,
"learning_rate": 3.9367475604658485e-05,
"loss": 0.4037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4248051643371582,
"step": 745,
"valid_targets_mean": 2367.8,
"valid_targets_min": 1159
},
{
"epoch": 1.2155591572123177,
"grad_norm": 0.7159039861695103,
"learning_rate": 3.9347151840573915e-05,
"loss": 0.4161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47999000549316406,
"step": 750,
"valid_targets_mean": 3596.5,
"valid_targets_min": 1075
},
{
"epoch": 1.2236628849270665,
"grad_norm": 0.6398486566542297,
"learning_rate": 3.932651212011479e-05,
"loss": 0.4168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5003429055213928,
"step": 755,
"valid_targets_mean": 5000.0,
"valid_targets_min": 358
},
{
"epoch": 1.2317666126418152,
"grad_norm": 0.624969106257508,
"learning_rate": 3.930555678034628e-05,
"loss": 0.4071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4231489598751068,
"step": 760,
"valid_targets_mean": 4428.4,
"valid_targets_min": 1694
},
{
"epoch": 1.239870340356564,
"grad_norm": 0.7089448788566617,
"learning_rate": 3.9284286163487924e-05,
"loss": 0.4081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4825202226638794,
"step": 765,
"valid_targets_mean": 3411.8,
"valid_targets_min": 1277
},
{
"epoch": 1.2479740680713127,
"grad_norm": 0.759421400318165,
"learning_rate": 3.9262700616908006e-05,
"loss": 0.4374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4094354510307312,
"step": 770,
"valid_targets_mean": 2685.1,
"valid_targets_min": 952
},
{
"epoch": 1.2560777957860616,
"grad_norm": 0.5529348501565219,
"learning_rate": 3.924080049311791e-05,
"loss": 0.3975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37100690603256226,
"step": 775,
"valid_targets_mean": 4895.1,
"valid_targets_min": 1178
},
{
"epoch": 1.2641815235008105,
"grad_norm": 0.619539071217271,
"learning_rate": 3.921858614976632e-05,
"loss": 0.4127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4086681604385376,
"step": 780,
"valid_targets_mean": 3785.5,
"valid_targets_min": 1038
},
{
"epoch": 1.2722852512155591,
"grad_norm": 0.5238357820823653,
"learning_rate": 3.919605794963343e-05,
"loss": 0.4185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39525216817855835,
"step": 785,
"valid_targets_mean": 5541.9,
"valid_targets_min": 1276
},
{
"epoch": 1.280388978930308,
"grad_norm": 0.5092409315061598,
"learning_rate": 3.9173216260624994e-05,
"loss": 0.4171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4608556628227234,
"step": 790,
"valid_targets_mean": 6425.1,
"valid_targets_min": 2062
},
{
"epoch": 1.2884927066450567,
"grad_norm": 0.6410692988138462,
"learning_rate": 3.915006145576632e-05,
"loss": 0.3949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.344308078289032,
"step": 795,
"valid_targets_mean": 3473.1,
"valid_targets_min": 1147
},
{
"epoch": 1.2965964343598055,
"grad_norm": 0.7056554788066899,
"learning_rate": 3.912659391319617e-05,
"loss": 0.4397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.483992338180542,
"step": 800,
"valid_targets_mean": 3135.4,
"valid_targets_min": 1593
},
{
"epoch": 1.3047001620745542,
"grad_norm": 0.4873176150043294,
"learning_rate": 3.910281401616061e-05,
"loss": 0.3886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34384751319885254,
"step": 805,
"valid_targets_mean": 5550.6,
"valid_targets_min": 1641
},
{
"epoch": 1.312803889789303,
"grad_norm": 0.6927361702376568,
"learning_rate": 3.907872215300672e-05,
"loss": 0.3893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5015307664871216,
"step": 810,
"valid_targets_mean": 4136.8,
"valid_targets_min": 1319
},
{
"epoch": 1.320907617504052,
"grad_norm": 0.7312277221405057,
"learning_rate": 3.905431871717628e-05,
"loss": 0.423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3949721157550812,
"step": 815,
"valid_targets_mean": 3217.5,
"valid_targets_min": 995
},
{
"epoch": 1.3290113452188006,
"grad_norm": 0.6697071515516008,
"learning_rate": 3.902960410719931e-05,
"loss": 0.3975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37480708956718445,
"step": 820,
"valid_targets_mean": 4123.7,
"valid_targets_min": 1396
},
{
"epoch": 1.3371150729335495,
"grad_norm": 0.672036926562655,
"learning_rate": 3.900457872668763e-05,
"loss": 0.4257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42396080493927,
"step": 825,
"valid_targets_mean": 3633.0,
"valid_targets_min": 1318
},
{
"epoch": 1.3452188006482984,
"grad_norm": 0.7642734408208844,
"learning_rate": 3.897924298432816e-05,
"loss": 0.4193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41950348019599915,
"step": 830,
"valid_targets_mean": 3189.9,
"valid_targets_min": 775
},
{
"epoch": 1.353322528363047,
"grad_norm": 0.6463330876952285,
"learning_rate": 3.895359729387636e-05,
"loss": 0.4157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39035725593566895,
"step": 835,
"valid_targets_mean": 3329.4,
"valid_targets_min": 1038
},
{
"epoch": 1.3614262560777957,
"grad_norm": 0.6294863371097716,
"learning_rate": 3.892764207414939e-05,
"loss": 0.3883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3504693806171417,
"step": 840,
"valid_targets_mean": 3639.1,
"valid_targets_min": 1118
},
{
"epoch": 1.3695299837925445,
"grad_norm": 0.7969453453498634,
"learning_rate": 3.890137774901931e-05,
"loss": 0.4373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46982237696647644,
"step": 845,
"valid_targets_mean": 3004.3,
"valid_targets_min": 1046
},
{
"epoch": 1.3776337115072934,
"grad_norm": 0.721881420599743,
"learning_rate": 3.887480474740616e-05,
"loss": 0.4039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4777338206768036,
"step": 850,
"valid_targets_mean": 3069.9,
"valid_targets_min": 1533
},
{
"epoch": 1.385737439222042,
"grad_norm": 0.6847253726579977,
"learning_rate": 3.8847923503270915e-05,
"loss": 0.4118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3960109353065491,
"step": 855,
"valid_targets_mean": 3656.4,
"valid_targets_min": 1090
},
{
"epoch": 1.393841166936791,
"grad_norm": 0.6216929584617436,
"learning_rate": 3.8820734455608464e-05,
"loss": 0.4082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4312170147895813,
"step": 860,
"valid_targets_mean": 4023.9,
"valid_targets_min": 954
},
{
"epoch": 1.4019448946515398,
"grad_norm": 0.5892956812304465,
"learning_rate": 3.879323804844038e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3535316586494446,
"step": 865,
"valid_targets_mean": 4127.8,
"valid_targets_min": 1471
},
{
"epoch": 1.4100486223662885,
"grad_norm": 0.8082279554048201,
"learning_rate": 3.876543473080771e-05,
"loss": 0.4261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4516857862472534,
"step": 870,
"valid_targets_mean": 3422.7,
"valid_targets_min": 1390
},
{
"epoch": 1.4181523500810373,
"grad_norm": 0.48789635530901226,
"learning_rate": 3.87373249567636e-05,
"loss": 0.4178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3681475818157196,
"step": 875,
"valid_targets_mean": 5620.6,
"valid_targets_min": 943
},
{
"epoch": 1.426256077795786,
"grad_norm": 0.6612612675219925,
"learning_rate": 3.870890918536592e-05,
"loss": 0.4047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38521233201026917,
"step": 880,
"valid_targets_mean": 3554.9,
"valid_targets_min": 826
},
{
"epoch": 1.4343598055105349,
"grad_norm": 0.6937842376936233,
"learning_rate": 3.8680187880669765e-05,
"loss": 0.4346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4324935972690582,
"step": 885,
"valid_targets_mean": 3092.2,
"valid_targets_min": 1330
},
{
"epoch": 1.4424635332252835,
"grad_norm": 0.6157750782438423,
"learning_rate": 3.865116151171983e-05,
"loss": 0.4053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40046823024749756,
"step": 890,
"valid_targets_mean": 3759.9,
"valid_targets_min": 1438
},
{
"epoch": 1.4505672609400324,
"grad_norm": 0.7167528050751656,
"learning_rate": 3.8621830552542826e-05,
"loss": 0.4149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5026776194572449,
"step": 895,
"valid_targets_mean": 3752.6,
"valid_targets_min": 1342
},
{
"epoch": 1.4586709886547813,
"grad_norm": 0.8431157727162455,
"learning_rate": 3.859219548213965e-05,
"loss": 0.3728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35948169231414795,
"step": 900,
"valid_targets_mean": 4141.4,
"valid_targets_min": 982
},
{
"epoch": 1.46677471636953,
"grad_norm": 0.5786833063220671,
"learning_rate": 3.856225678447764e-05,
"loss": 0.3812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39766621589660645,
"step": 905,
"valid_targets_mean": 4228.1,
"valid_targets_min": 1376
},
{
"epoch": 1.4748784440842788,
"grad_norm": 0.7049559260095754,
"learning_rate": 3.853201494848263e-05,
"loss": 0.4019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41903460025787354,
"step": 910,
"valid_targets_mean": 2839.4,
"valid_targets_min": 1383
},
{
"epoch": 1.4829821717990275,
"grad_norm": 0.5730202377371769,
"learning_rate": 3.8501470468030984e-05,
"loss": 0.4318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40747907757759094,
"step": 915,
"valid_targets_mean": 3931.9,
"valid_targets_min": 1028
},
{
"epoch": 1.4910858995137763,
"grad_norm": 0.43206946086028963,
"learning_rate": 3.84706238419415e-05,
"loss": 0.3631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2669350504875183,
"step": 920,
"valid_targets_mean": 5546.7,
"valid_targets_min": 905
},
{
"epoch": 1.499189627228525,
"grad_norm": 0.6471623110865716,
"learning_rate": 3.8439475573967315e-05,
"loss": 0.4107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4179629683494568,
"step": 925,
"valid_targets_mean": 4247.6,
"valid_targets_min": 1447
},
{
"epoch": 1.5072933549432739,
"grad_norm": 0.6122343718916604,
"learning_rate": 3.840802617278763e-05,
"loss": 0.4017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4195345640182495,
"step": 930,
"valid_targets_mean": 3743.9,
"valid_targets_min": 1011
},
{
"epoch": 1.5153970826580228,
"grad_norm": 0.5128272228930184,
"learning_rate": 3.837627615199942e-05,
"loss": 0.3743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3458319306373596,
"step": 935,
"valid_targets_mean": 4861.8,
"valid_targets_min": 1247
},
{
"epoch": 1.5235008103727714,
"grad_norm": 0.5372139985938604,
"learning_rate": 3.834422603010906e-05,
"loss": 0.3887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34437286853790283,
"step": 940,
"valid_targets_mean": 5274.9,
"valid_targets_min": 1164
},
{
"epoch": 1.5316045380875203,
"grad_norm": 0.7168389521153298,
"learning_rate": 3.831187633052384e-05,
"loss": 0.4173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5015881657600403,
"step": 945,
"valid_targets_mean": 4582.9,
"valid_targets_min": 1236
},
{
"epoch": 1.5397082658022692,
"grad_norm": 0.5084505658863171,
"learning_rate": 3.8279227581543424e-05,
"loss": 0.4032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3953602612018585,
"step": 950,
"valid_targets_mean": 4978.7,
"valid_targets_min": 1067
},
{
"epoch": 1.5478119935170178,
"grad_norm": 0.5907435331885859,
"learning_rate": 3.824628031635122e-05,
"loss": 0.4198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40457284450531006,
"step": 955,
"valid_targets_mean": 3979.6,
"valid_targets_min": 1202
},
{
"epoch": 1.5559157212317665,
"grad_norm": 0.6571353061058341,
"learning_rate": 3.8213035073005665e-05,
"loss": 0.4104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3425450325012207,
"step": 960,
"valid_targets_mean": 4567.8,
"valid_targets_min": 1203
},
{
"epoch": 1.5640194489465153,
"grad_norm": 0.679939959714484,
"learning_rate": 3.817949239443147e-05,
"loss": 0.3983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37692564725875854,
"step": 965,
"valid_targets_mean": 2661.4,
"valid_targets_min": 1105
},
{
"epoch": 1.5721231766612642,
"grad_norm": 0.530755056682054,
"learning_rate": 3.814565282841071e-05,
"loss": 0.4017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42367827892303467,
"step": 970,
"valid_targets_mean": 5225.1,
"valid_targets_min": 828
},
{
"epoch": 1.5802269043760129,
"grad_norm": 0.7466237984825811,
"learning_rate": 3.81115169275739e-05,
"loss": 0.4176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5087313055992126,
"step": 975,
"valid_targets_mean": 2849.9,
"valid_targets_min": 1079
},
{
"epoch": 1.5883306320907618,
"grad_norm": 0.5840496257255798,
"learning_rate": 3.8077085249390997e-05,
"loss": 0.385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3712337613105774,
"step": 980,
"valid_targets_mean": 3896.5,
"valid_targets_min": 1698
},
{
"epoch": 1.5964343598055106,
"grad_norm": 0.677800468030808,
"learning_rate": 3.8042358356162215e-05,
"loss": 0.4315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4169023036956787,
"step": 985,
"valid_targets_mean": 3102.1,
"valid_targets_min": 863
},
{
"epoch": 1.6045380875202593,
"grad_norm": 0.5126684483285767,
"learning_rate": 3.8007336815008945e-05,
"loss": 0.4127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32481974363327026,
"step": 990,
"valid_targets_mean": 4557.1,
"valid_targets_min": 974
},
{
"epoch": 1.6126418152350082,
"grad_norm": 0.5972646097264587,
"learning_rate": 3.797202119786442e-05,
"loss": 0.4141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3950786590576172,
"step": 995,
"valid_targets_mean": 4294.4,
"valid_targets_min": 1126
},
{
"epoch": 1.620745542949757,
"grad_norm": 0.5937224848479558,
"learning_rate": 3.79364120814644e-05,
"loss": 0.4127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3952077031135559,
"step": 1000,
"valid_targets_mean": 3905.6,
"valid_targets_min": 1188
},
{
"epoch": 1.6288492706645057,
"grad_norm": 0.6321038959683297,
"learning_rate": 3.790051004733775e-05,
"loss": 0.4201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42207908630371094,
"step": 1005,
"valid_targets_mean": 3878.1,
"valid_targets_min": 1058
},
{
"epoch": 1.6369529983792543,
"grad_norm": 1.1186970348539031,
"learning_rate": 3.786431568179697e-05,
"loss": 0.3937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3650881052017212,
"step": 1010,
"valid_targets_mean": 5200.1,
"valid_targets_min": 2239
},
{
"epoch": 1.6450567260940032,
"grad_norm": 0.5774237494154663,
"learning_rate": 3.7827829575928536e-05,
"loss": 0.3736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3719528913497925,
"step": 1015,
"valid_targets_mean": 4792.2,
"valid_targets_min": 733
},
{
"epoch": 1.653160453808752,
"grad_norm": 0.6601144475343061,
"learning_rate": 3.779105232558337e-05,
"loss": 0.4043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4179123044013977,
"step": 1020,
"valid_targets_mean": 3453.9,
"valid_targets_min": 759
},
{
"epoch": 1.6612641815235007,
"grad_norm": 0.503079426746597,
"learning_rate": 3.775398453136701e-05,
"loss": 0.3738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31408727169036865,
"step": 1025,
"valid_targets_mean": 5430.4,
"valid_targets_min": 922
},
{
"epoch": 1.6693679092382496,
"grad_norm": 0.7753835008841552,
"learning_rate": 3.771662679862984e-05,
"loss": 0.3767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39880800247192383,
"step": 1030,
"valid_targets_mean": 2442.4,
"valid_targets_min": 1370
},
{
"epoch": 1.6774716369529985,
"grad_norm": 0.6991030543306379,
"learning_rate": 3.767897973745721e-05,
"loss": 0.4159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44633948802948,
"step": 1035,
"valid_targets_mean": 3597.4,
"valid_targets_min": 1057
},
{
"epoch": 1.6855753646677472,
"grad_norm": 0.7679002110960852,
"learning_rate": 3.764104396265946e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3935224711894989,
"step": 1040,
"valid_targets_mean": 3113.6,
"valid_targets_min": 1097
},
{
"epoch": 1.6936790923824958,
"grad_norm": 0.48586847500539443,
"learning_rate": 3.760282009376187e-05,
"loss": 0.3647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3813055157661438,
"step": 1045,
"valid_targets_mean": 4965.1,
"valid_targets_min": 1090
},
{
"epoch": 1.7017828200972447,
"grad_norm": 0.9069360496102079,
"learning_rate": 3.756430875499458e-05,
"loss": 0.4018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44932669401168823,
"step": 1050,
"valid_targets_mean": 2457.4,
"valid_targets_min": 1025
},
{
"epoch": 1.7098865478119936,
"grad_norm": 0.5147049425616307,
"learning_rate": 3.7525510575282354e-05,
"loss": 0.4147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3647802174091339,
"step": 1055,
"valid_targets_mean": 5582.6,
"valid_targets_min": 1001
},
{
"epoch": 1.7179902755267422,
"grad_norm": 0.5324879798136473,
"learning_rate": 3.748642618823432e-05,
"loss": 0.3832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3285607099533081,
"step": 1060,
"valid_targets_mean": 5071.8,
"valid_targets_min": 1431
},
{
"epoch": 1.726094003241491,
"grad_norm": 0.647787323939788,
"learning_rate": 3.744705623213365e-05,
"loss": 0.3851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4008070230484009,
"step": 1065,
"valid_targets_mean": 3614.9,
"valid_targets_min": 1114
},
{
"epoch": 1.73419773095624,
"grad_norm": 0.6619832349327134,
"learning_rate": 3.74074013499271e-05,
"loss": 0.4134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42244502902030945,
"step": 1070,
"valid_targets_mean": 3305.0,
"valid_targets_min": 1453
},
{
"epoch": 1.7423014586709886,
"grad_norm": 0.6542150803144281,
"learning_rate": 3.736746218921453e-05,
"loss": 0.4391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42766737937927246,
"step": 1075,
"valid_targets_mean": 3408.0,
"valid_targets_min": 1420
},
{
"epoch": 1.7504051863857373,
"grad_norm": 0.7258838869557971,
"learning_rate": 3.732723940223832e-05,
"loss": 0.3782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39612990617752075,
"step": 1080,
"valid_targets_mean": 2531.2,
"valid_targets_min": 756
},
{
"epoch": 1.7585089141004864,
"grad_norm": 0.5910566163663715,
"learning_rate": 3.7286733645872726e-05,
"loss": 0.3818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4122849404811859,
"step": 1085,
"valid_targets_mean": 4625.3,
"valid_targets_min": 1063
},
{
"epoch": 1.766612641815235,
"grad_norm": 0.6433905775726179,
"learning_rate": 3.724594558161315e-05,
"loss": 0.4116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4537995755672455,
"step": 1090,
"valid_targets_mean": 3713.8,
"valid_targets_min": 1241
},
{
"epoch": 1.7747163695299837,
"grad_norm": 0.726822537416244,
"learning_rate": 3.720487587556534e-05,
"loss": 0.4445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46592673659324646,
"step": 1095,
"valid_targets_mean": 3423.6,
"valid_targets_min": 1516
},
{
"epoch": 1.7828200972447326,
"grad_norm": 0.5792115707093757,
"learning_rate": 3.716352519843448e-05,
"loss": 0.3869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3367713689804077,
"step": 1100,
"valid_targets_mean": 4104.1,
"valid_targets_min": 1400
},
{
"epoch": 1.7909238249594814,
"grad_norm": 0.6039687716465919,
"learning_rate": 3.712189422551431e-05,
"loss": 0.3674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34517428278923035,
"step": 1105,
"valid_targets_mean": 3525.6,
"valid_targets_min": 628
},
{
"epoch": 1.79902755267423,
"grad_norm": 0.718725524451317,
"learning_rate": 3.7079983636676005e-05,
"loss": 0.4015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39871928095817566,
"step": 1110,
"valid_targets_mean": 3444.6,
"valid_targets_min": 1017
},
{
"epoch": 1.807131280388979,
"grad_norm": 0.6537149777525709,
"learning_rate": 3.703779411635714e-05,
"loss": 0.4066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3639248013496399,
"step": 1115,
"valid_targets_mean": 3092.6,
"valid_targets_min": 749
},
{
"epoch": 1.8152350081037278,
"grad_norm": 0.5629855946423489,
"learning_rate": 3.6995326353550515e-05,
"loss": 0.4053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3245788514614105,
"step": 1120,
"valid_targets_mean": 4038.6,
"valid_targets_min": 1146
},
{
"epoch": 1.8233387358184765,
"grad_norm": 0.5734716036860011,
"learning_rate": 3.695258104179284e-05,
"loss": 0.3876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39152956008911133,
"step": 1125,
"valid_targets_mean": 4071.9,
"valid_targets_min": 1410
},
{
"epoch": 1.8314424635332252,
"grad_norm": 0.5854495000674845,
"learning_rate": 3.690955887915347e-05,
"loss": 0.4394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4314863085746765,
"step": 1130,
"valid_targets_mean": 4155.2,
"valid_targets_min": 1275
},
{
"epoch": 1.839546191247974,
"grad_norm": 0.5835121083788867,
"learning_rate": 3.686626056822298e-05,
"loss": 0.3728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3812408745288849,
"step": 1135,
"valid_targets_mean": 3790.1,
"valid_targets_min": 1133
},
{
"epoch": 1.847649918962723,
"grad_norm": 0.5390903203193496,
"learning_rate": 3.682268681610169e-05,
"loss": 0.4031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3393847942352295,
"step": 1140,
"valid_targets_mean": 4877.7,
"valid_targets_min": 1039
},
{
"epoch": 1.8557536466774716,
"grad_norm": 0.6666436255178859,
"learning_rate": 3.677883833438814e-05,
"loss": 0.38,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3733408451080322,
"step": 1145,
"valid_targets_mean": 2816.2,
"valid_targets_min": 993
},
{
"epoch": 1.8638573743922204,
"grad_norm": 0.6744209523213708,
"learning_rate": 3.6734715839167427e-05,
"loss": 0.3776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41044723987579346,
"step": 1150,
"valid_targets_mean": 2894.9,
"valid_targets_min": 1019
},
{
"epoch": 1.8719611021069693,
"grad_norm": 0.5776259559281988,
"learning_rate": 3.669032005099954e-05,
"loss": 0.3672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31816449761390686,
"step": 1155,
"valid_targets_mean": 3865.9,
"valid_targets_min": 961
},
{
"epoch": 1.880064829821718,
"grad_norm": 0.5069812438471043,
"learning_rate": 3.664565169490761e-05,
"loss": 0.3728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34008556604385376,
"step": 1160,
"valid_targets_mean": 5045.1,
"valid_targets_min": 1271
},
{
"epoch": 1.8881685575364666,
"grad_norm": 0.6393979867095283,
"learning_rate": 3.660071150036602e-05,
"loss": 0.3599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36201924085617065,
"step": 1165,
"valid_targets_mean": 3738.8,
"valid_targets_min": 1312
},
{
"epoch": 1.8962722852512157,
"grad_norm": 0.6385627539570938,
"learning_rate": 3.655550020128852e-05,
"loss": 0.4085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4077168107032776,
"step": 1170,
"valid_targets_mean": 3565.6,
"valid_targets_min": 1383
},
{
"epoch": 1.9043760129659644,
"grad_norm": 0.5922135114548367,
"learning_rate": 3.651001853601627e-05,
"loss": 0.4176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.405472993850708,
"step": 1175,
"valid_targets_mean": 3930.4,
"valid_targets_min": 1160
},
{
"epoch": 1.912479740680713,
"grad_norm": 0.589394070370728,
"learning_rate": 3.646426724730572e-05,
"loss": 0.3919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3850012421607971,
"step": 1180,
"valid_targets_mean": 3923.1,
"valid_targets_min": 1160
},
{
"epoch": 1.920583468395462,
"grad_norm": 0.4849462911152238,
"learning_rate": 3.641824708231653e-05,
"loss": 0.3806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3893633186817169,
"step": 1185,
"valid_targets_mean": 5844.6,
"valid_targets_min": 1425
},
{
"epoch": 1.9286871961102108,
"grad_norm": 0.4868660520441822,
"learning_rate": 3.6371958792599346e-05,
"loss": 0.3971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4328196048736572,
"step": 1190,
"valid_targets_mean": 5689.4,
"valid_targets_min": 891
},
{
"epoch": 1.9367909238249594,
"grad_norm": 0.7830835596596479,
"learning_rate": 3.632540313408353e-05,
"loss": 0.3763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37044936418533325,
"step": 1195,
"valid_targets_mean": 3209.5,
"valid_targets_min": 818
},
{
"epoch": 1.9448946515397083,
"grad_norm": 0.5564325863706703,
"learning_rate": 3.627858086706483e-05,
"loss": 0.4226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36431488394737244,
"step": 1200,
"valid_targets_mean": 4813.8,
"valid_targets_min": 1456
},
{
"epoch": 1.9529983792544572,
"grad_norm": 0.5822242628899343,
"learning_rate": 3.6231492756192924e-05,
"loss": 0.3924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37201085686683655,
"step": 1205,
"valid_targets_mean": 3925.2,
"valid_targets_min": 952
},
{
"epoch": 1.9611021069692058,
"grad_norm": 0.5299007245341597,
"learning_rate": 3.618413957045899e-05,
"loss": 0.3548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31111475825309753,
"step": 1210,
"valid_targets_mean": 4279.1,
"valid_targets_min": 1016
},
{
"epoch": 1.9692058346839545,
"grad_norm": 0.7156083555424475,
"learning_rate": 3.6136522083183096e-05,
"loss": 0.4136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4434228539466858,
"step": 1215,
"valid_targets_mean": 2801.8,
"valid_targets_min": 1138
},
{
"epoch": 1.9773095623987034,
"grad_norm": 0.7191486420410436,
"learning_rate": 3.608864107200159e-05,
"loss": 0.394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40111202001571655,
"step": 1220,
"valid_targets_mean": 3650.6,
"valid_targets_min": 959
},
{
"epoch": 1.9854132901134522,
"grad_norm": 0.7177268568233205,
"learning_rate": 3.604049731885442e-05,
"loss": 0.4102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4274698793888092,
"step": 1225,
"valid_targets_mean": 2859.1,
"valid_targets_min": 914
},
{
"epoch": 1.993517017828201,
"grad_norm": 0.5936165125904502,
"learning_rate": 3.599209160997234e-05,
"loss": 0.4041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4391655921936035,
"step": 1230,
"valid_targets_mean": 4539.0,
"valid_targets_min": 1030
},
{
"epoch": 2.0016207455429496,
"grad_norm": 0.6607150994416292,
"learning_rate": 3.594342473586406e-05,
"loss": 0.359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3753243684768677,
"step": 1235,
"valid_targets_mean": 3325.9,
"valid_targets_min": 1040
},
{
"epoch": 2.0097244732576987,
"grad_norm": 0.6229919055152918,
"learning_rate": 3.589449749130337e-05,
"loss": 0.3713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3249698877334595,
"step": 1240,
"valid_targets_mean": 3667.4,
"valid_targets_min": 1301
},
{
"epoch": 2.0178282009724473,
"grad_norm": 0.596009922929333,
"learning_rate": 3.5845310675316134e-05,
"loss": 0.3692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35430464148521423,
"step": 1245,
"valid_targets_mean": 4640.9,
"valid_targets_min": 1234
},
{
"epoch": 2.025931928687196,
"grad_norm": 0.6380265961179253,
"learning_rate": 3.5795865091167266e-05,
"loss": 0.3419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33436498045921326,
"step": 1250,
"valid_targets_mean": 3602.1,
"valid_targets_min": 1405
},
{
"epoch": 2.034035656401945,
"grad_norm": 0.6162634046057834,
"learning_rate": 3.574616154634758e-05,
"loss": 0.3513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.321361780166626,
"step": 1255,
"valid_targets_mean": 3951.0,
"valid_targets_min": 1218
},
{
"epoch": 2.0421393841166937,
"grad_norm": 0.8549853836990146,
"learning_rate": 3.569620085256062e-05,
"loss": 0.3671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34706395864486694,
"step": 1260,
"valid_targets_mean": 2600.3,
"valid_targets_min": 1178
},
{
"epoch": 2.0502431118314424,
"grad_norm": 0.6157850695159539,
"learning_rate": 3.564598382570943e-05,
"loss": 0.3577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31989988684654236,
"step": 1265,
"valid_targets_mean": 3471.0,
"valid_targets_min": 991
},
{
"epoch": 2.0583468395461915,
"grad_norm": 0.6912760968032348,
"learning_rate": 3.559551128588316e-05,
"loss": 0.3561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3643125295639038,
"step": 1270,
"valid_targets_mean": 3251.2,
"valid_targets_min": 1369
},
{
"epoch": 2.06645056726094,
"grad_norm": 0.7610727310356797,
"learning_rate": 3.5544784057343746e-05,
"loss": 0.3989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44861117005348206,
"step": 1275,
"valid_targets_mean": 2874.9,
"valid_targets_min": 1049
},
{
"epoch": 2.0745542949756888,
"grad_norm": 0.5567253168047179,
"learning_rate": 3.549380296851242e-05,
"loss": 0.356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34195390343666077,
"step": 1280,
"valid_targets_mean": 4699.7,
"valid_targets_min": 1283
},
{
"epoch": 2.0826580226904374,
"grad_norm": 0.6193215633518243,
"learning_rate": 3.544256885195616e-05,
"loss": 0.3697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36366885900497437,
"step": 1285,
"valid_targets_mean": 4513.9,
"valid_targets_min": 1327
},
{
"epoch": 2.0907617504051865,
"grad_norm": 0.6104236788483114,
"learning_rate": 3.539108254437414e-05,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3442176580429077,
"step": 1290,
"valid_targets_mean": 4325.1,
"valid_targets_min": 1184
},
{
"epoch": 2.098865478119935,
"grad_norm": 1.1540653788876254,
"learning_rate": 3.5339344886584015e-05,
"loss": 0.3837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47065746784210205,
"step": 1295,
"valid_targets_mean": 4431.3,
"valid_targets_min": 1418
},
{
"epoch": 2.106969205834684,
"grad_norm": 0.6313032622328161,
"learning_rate": 3.5287356723508245e-05,
"loss": 0.3774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3796147108078003,
"step": 1300,
"valid_targets_mean": 3835.1,
"valid_targets_min": 1712
},
{
"epoch": 2.115072933549433,
"grad_norm": 0.5995277124296124,
"learning_rate": 3.523511890416023e-05,
"loss": 0.365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3411373496055603,
"step": 1305,
"valid_targets_mean": 4134.9,
"valid_targets_min": 1533
},
{
"epoch": 2.1231766612641816,
"grad_norm": 0.6323877139662327,
"learning_rate": 3.518263228163051e-05,
"loss": 0.3738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3897821605205536,
"step": 1310,
"valid_targets_mean": 3811.7,
"valid_targets_min": 1073
},
{
"epoch": 2.1312803889789302,
"grad_norm": 0.6142230133720461,
"learning_rate": 3.51298977130728e-05,
"loss": 0.3768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35401493310928345,
"step": 1315,
"valid_targets_mean": 4104.4,
"valid_targets_min": 1090
},
{
"epoch": 2.139384116693679,
"grad_norm": 0.575159991305633,
"learning_rate": 3.507691605968997e-05,
"loss": 0.3386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3774334788322449,
"step": 1320,
"valid_targets_mean": 4597.1,
"valid_targets_min": 1139
},
{
"epoch": 2.147487844408428,
"grad_norm": 0.650651417151311,
"learning_rate": 3.5023688186720047e-05,
"loss": 0.3865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3409254550933838,
"step": 1325,
"valid_targets_mean": 3917.1,
"valid_targets_min": 1170
},
{
"epoch": 2.1555915721231766,
"grad_norm": 0.520190676285313,
"learning_rate": 3.497021496342203e-05,
"loss": 0.3525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37429600954055786,
"step": 1330,
"valid_targets_mean": 5373.3,
"valid_targets_min": 1456
},
{
"epoch": 2.1636952998379253,
"grad_norm": 0.8766333160570894,
"learning_rate": 3.491649726306168e-05,
"loss": 0.3596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45493656396865845,
"step": 1335,
"valid_targets_mean": 3073.1,
"valid_targets_min": 1138
},
{
"epoch": 2.1717990275526744,
"grad_norm": 0.48924493035671224,
"learning_rate": 3.486253596289734e-05,
"loss": 0.3724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3554176092147827,
"step": 1340,
"valid_targets_mean": 8016.4,
"valid_targets_min": 1256
},
{
"epoch": 2.179902755267423,
"grad_norm": 0.6152012628911511,
"learning_rate": 3.4808331944165524e-05,
"loss": 0.3655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33981600403785706,
"step": 1345,
"valid_targets_mean": 3537.2,
"valid_targets_min": 1047
},
{
"epoch": 2.1880064829821717,
"grad_norm": 0.5302271963442517,
"learning_rate": 3.4753886092066546e-05,
"loss": 0.337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2537047564983368,
"step": 1350,
"valid_targets_mean": 5067.1,
"valid_targets_min": 1520
},
{
"epoch": 2.1961102106969204,
"grad_norm": 0.6367347476094577,
"learning_rate": 3.469919929575012e-05,
"loss": 0.3537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.347379207611084,
"step": 1355,
"valid_targets_mean": 3530.1,
"valid_targets_min": 358
},
{
"epoch": 2.2042139384116695,
"grad_norm": 7.616842383691646,
"learning_rate": 3.464427244830076e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3965144455432892,
"step": 1360,
"valid_targets_mean": 4835.8,
"valid_targets_min": 922
},
{
"epoch": 2.212317666126418,
"grad_norm": 0.5772928971804826,
"learning_rate": 3.458910644672324e-05,
"loss": 0.3315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3225036859512329,
"step": 1365,
"valid_targets_mean": 4137.2,
"valid_targets_min": 1041
},
{
"epoch": 2.2204213938411668,
"grad_norm": 0.7652072059945616,
"learning_rate": 3.453370219192794e-05,
"loss": 0.3621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3325500786304474,
"step": 1370,
"valid_targets_mean": 3532.5,
"valid_targets_min": 1434
},
{
"epoch": 2.228525121555916,
"grad_norm": 0.6273654869200413,
"learning_rate": 3.4478060588716116e-05,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3371928632259369,
"step": 1375,
"valid_targets_mean": 4380.4,
"valid_targets_min": 1101
},
{
"epoch": 2.2366288492706645,
"grad_norm": 0.5330490634477026,
"learning_rate": 3.442218254576516e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30799007415771484,
"step": 1380,
"valid_targets_mean": 4405.8,
"valid_targets_min": 1395
},
{
"epoch": 2.244732576985413,
"grad_norm": 0.6034321724192573,
"learning_rate": 3.436606897561372e-05,
"loss": 0.3584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3362310528755188,
"step": 1385,
"valid_targets_mean": 3742.8,
"valid_targets_min": 1574
},
{
"epoch": 2.2528363047001623,
"grad_norm": 0.6490329309441155,
"learning_rate": 3.430972079464682e-05,
"loss": 0.3901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34692591428756714,
"step": 1390,
"valid_targets_mean": 3377.1,
"valid_targets_min": 886
},
{
"epoch": 2.260940032414911,
"grad_norm": 0.6561577805947444,
"learning_rate": 3.425313892308089e-05,
"loss": 0.3798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47548946738243103,
"step": 1395,
"valid_targets_mean": 4475.6,
"valid_targets_min": 868
},
{
"epoch": 2.2690437601296596,
"grad_norm": 0.7213768996297372,
"learning_rate": 3.419632428494873e-05,
"loss": 0.3854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45764851570129395,
"step": 1400,
"valid_targets_mean": 3668.8,
"valid_targets_min": 784
},
{
"epoch": 2.2771474878444082,
"grad_norm": 0.676480480135692,
"learning_rate": 3.413927780808443e-05,
"loss": 0.3544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36912989616394043,
"step": 1405,
"valid_targets_mean": 3886.9,
"valid_targets_min": 642
},
{
"epoch": 2.2852512155591573,
"grad_norm": 0.6377817982477058,
"learning_rate": 3.4082000424108235e-05,
"loss": 0.3659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43174880743026733,
"step": 1410,
"valid_targets_mean": 4233.6,
"valid_targets_min": 1040
},
{
"epoch": 2.293354943273906,
"grad_norm": 0.5519348419998006,
"learning_rate": 3.402449306841128e-05,
"loss": 0.3967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31168171763420105,
"step": 1415,
"valid_targets_mean": 4307.8,
"valid_targets_min": 1098
},
{
"epoch": 2.3014586709886546,
"grad_norm": 0.7505030716064821,
"learning_rate": 3.396675668014035e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37064194679260254,
"step": 1420,
"valid_targets_mean": 3508.5,
"valid_targets_min": 971
},
{
"epoch": 2.3095623987034037,
"grad_norm": 0.6153586073602998,
"learning_rate": 3.390879220218258e-05,
"loss": 0.341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.324023574590683,
"step": 1425,
"valid_targets_mean": 3714.1,
"valid_targets_min": 1192
},
{
"epoch": 2.3176661264181524,
"grad_norm": 0.6047177695229424,
"learning_rate": 3.385060058114995e-05,
"loss": 0.371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36816906929016113,
"step": 1430,
"valid_targets_mean": 4465.9,
"valid_targets_min": 1218
},
{
"epoch": 2.325769854132901,
"grad_norm": 0.554001360948358,
"learning_rate": 3.379218276736393e-05,
"loss": 0.3663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32747846841812134,
"step": 1435,
"valid_targets_mean": 4328.4,
"valid_targets_min": 1183
},
{
"epoch": 2.3338735818476497,
"grad_norm": 0.7300247951181067,
"learning_rate": 3.373353971483992e-05,
"loss": 0.3827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39081335067749023,
"step": 1440,
"valid_targets_mean": 3143.4,
"valid_targets_min": 897
},
{
"epoch": 2.341977309562399,
"grad_norm": 0.7887680824193282,
"learning_rate": 3.367467238127165e-05,
"loss": 0.353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4153595268726349,
"step": 1445,
"valid_targets_mean": 2644.9,
"valid_targets_min": 1132
},
{
"epoch": 2.3500810372771475,
"grad_norm": 0.6128981493620611,
"learning_rate": 3.361558172801558e-05,
"loss": 0.3464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3145619034767151,
"step": 1450,
"valid_targets_mean": 3406.1,
"valid_targets_min": 951
},
{
"epoch": 2.358184764991896,
"grad_norm": 0.7057939890319916,
"learning_rate": 3.355626872007518e-05,
"loss": 0.3815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43307170271873474,
"step": 1455,
"valid_targets_mean": 3228.0,
"valid_targets_min": 1237
},
{
"epoch": 2.366288492706645,
"grad_norm": 1.245387675691084,
"learning_rate": 3.3496734326085154e-05,
"loss": 0.3844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5461128950119019,
"step": 1460,
"valid_targets_mean": 3818.5,
"valid_targets_min": 973
},
{
"epoch": 2.374392220421394,
"grad_norm": 0.7974141939772306,
"learning_rate": 3.3436979518295674e-05,
"loss": 0.3809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39469295740127563,
"step": 1465,
"valid_targets_mean": 2919.4,
"valid_targets_min": 964
},
{
"epoch": 2.3824959481361425,
"grad_norm": 0.7108670533735841,
"learning_rate": 3.337700527255643e-05,
"loss": 0.3687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3202032744884491,
"step": 1470,
"valid_targets_mean": 4618.8,
"valid_targets_min": 1204
},
{
"epoch": 2.3905996758508916,
"grad_norm": 0.7412244458586731,
"learning_rate": 3.331681256830074e-05,
"loss": 0.3566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3399648666381836,
"step": 1475,
"valid_targets_mean": 3429.4,
"valid_targets_min": 1292
},
{
"epoch": 2.3987034035656403,
"grad_norm": 0.5383118278414649,
"learning_rate": 3.325640238852958e-05,
"loss": 0.3393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3444640636444092,
"step": 1480,
"valid_targets_mean": 5254.6,
"valid_targets_min": 1150
},
{
"epoch": 2.406807131280389,
"grad_norm": 0.5928053691323958,
"learning_rate": 3.319577571979544e-05,
"loss": 0.3871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40096884965896606,
"step": 1485,
"valid_targets_mean": 4633.4,
"valid_targets_min": 1176
},
{
"epoch": 2.4149108589951376,
"grad_norm": 0.5049795409180116,
"learning_rate": 3.313493355218632e-05,
"loss": 0.3872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43719810247421265,
"step": 1490,
"valid_targets_mean": 6272.6,
"valid_targets_min": 981
},
{
"epoch": 2.4230145867098867,
"grad_norm": 0.8353029407587053,
"learning_rate": 3.307387687930947e-05,
"loss": 0.3483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41381019353866577,
"step": 1495,
"valid_targets_mean": 2182.9,
"valid_targets_min": 962
},
{
"epoch": 2.4311183144246353,
"grad_norm": 0.8126079203284331,
"learning_rate": 3.301260669827524e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40541964769363403,
"step": 1500,
"valid_targets_mean": 2986.6,
"valid_targets_min": 983
},
{
"epoch": 2.439222042139384,
"grad_norm": 0.641139311735153,
"learning_rate": 3.295112400968073e-05,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36821722984313965,
"step": 1505,
"valid_targets_mean": 3650.5,
"valid_targets_min": 1287
},
{
"epoch": 2.447325769854133,
"grad_norm": 0.720372072556044,
"learning_rate": 3.2889429817593494e-05,
"loss": 0.3687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3299311697483063,
"step": 1510,
"valid_targets_mean": 2849.4,
"valid_targets_min": 1233
},
{
"epoch": 2.4554294975688817,
"grad_norm": 0.6615710856738938,
"learning_rate": 3.2827525129535135e-05,
"loss": 0.3528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4220331311225891,
"step": 1515,
"valid_targets_mean": 3493.5,
"valid_targets_min": 813
},
{
"epoch": 2.4635332252836304,
"grad_norm": 0.6267811677605671,
"learning_rate": 3.276541095646482e-05,
"loss": 0.3856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4255092740058899,
"step": 1520,
"valid_targets_mean": 4085.3,
"valid_targets_min": 1327
},
{
"epoch": 2.471636952998379,
"grad_norm": 0.6283412448611168,
"learning_rate": 3.2703088312762825e-05,
"loss": 0.3746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37167081236839294,
"step": 1525,
"valid_targets_mean": 3667.0,
"valid_targets_min": 1152
},
{
"epoch": 2.479740680713128,
"grad_norm": 0.6150481887647228,
"learning_rate": 3.2640558216213914e-05,
"loss": 0.3525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3558899164199829,
"step": 1530,
"valid_targets_mean": 3783.0,
"valid_targets_min": 987
},
{
"epoch": 2.487844408427877,
"grad_norm": 0.7059041076787986,
"learning_rate": 3.2577821687990764e-05,
"loss": 0.3955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39561814069747925,
"step": 1535,
"valid_targets_mean": 3271.9,
"valid_targets_min": 995
},
{
"epoch": 2.4959481361426255,
"grad_norm": 0.6347284403899237,
"learning_rate": 3.2514879752637236e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.359174907207489,
"step": 1540,
"valid_targets_mean": 3839.1,
"valid_targets_min": 1142
},
{
"epoch": 2.5040518638573745,
"grad_norm": 0.695347992645094,
"learning_rate": 3.2451733438051705e-05,
"loss": 0.4004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4211786687374115,
"step": 1545,
"valid_targets_mean": 3237.3,
"valid_targets_min": 1200
},
{
"epoch": 2.512155591572123,
"grad_norm": 0.6572998579365059,
"learning_rate": 3.238838377547023e-05,
"loss": 0.3471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31920304894447327,
"step": 1550,
"valid_targets_mean": 3640.3,
"valid_targets_min": 666
},
{
"epoch": 2.520259319286872,
"grad_norm": 0.6183228297803092,
"learning_rate": 3.2324831799449724e-05,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3397529721260071,
"step": 1555,
"valid_targets_mean": 3801.9,
"valid_targets_min": 1076
},
{
"epoch": 2.528363047001621,
"grad_norm": 0.5922882925500382,
"learning_rate": 3.226107854785106e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40487492084503174,
"step": 1560,
"valid_targets_mean": 4336.1,
"valid_targets_min": 1168
},
{
"epoch": 2.5364667747163696,
"grad_norm": 0.5505805672615378,
"learning_rate": 3.2197125061822135e-05,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30663758516311646,
"step": 1565,
"valid_targets_mean": 5709.7,
"valid_targets_min": 1193
},
{
"epoch": 2.5445705024311183,
"grad_norm": 0.6592707151602514,
"learning_rate": 3.213297238578082e-05,
"loss": 0.3713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3352968096733093,
"step": 1570,
"valid_targets_mean": 3024.6,
"valid_targets_min": 370
},
{
"epoch": 2.5526742301458674,
"grad_norm": 0.6837888385824673,
"learning_rate": 3.206862156739799e-05,
"loss": 0.3663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3527699410915375,
"step": 1575,
"valid_targets_mean": 3217.2,
"valid_targets_min": 1165
},
{
"epoch": 2.560777957860616,
"grad_norm": 0.5714278693915779,
"learning_rate": 3.2004073657580314e-05,
"loss": 0.3257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3621138334274292,
"step": 1580,
"valid_targets_mean": 5215.3,
"valid_targets_min": 1660
},
{
"epoch": 2.5688816855753647,
"grad_norm": 0.632687459517687,
"learning_rate": 3.193932971045316e-05,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.378584623336792,
"step": 1585,
"valid_targets_mean": 3656.8,
"valid_targets_min": 1012
},
{
"epoch": 2.5769854132901133,
"grad_norm": 0.5154328163710282,
"learning_rate": 3.187439078334338e-05,
"loss": 0.3532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2569686770439148,
"step": 1590,
"valid_targets_mean": 4438.7,
"valid_targets_min": 1003
},
{
"epoch": 2.585089141004862,
"grad_norm": 0.8485853331997644,
"learning_rate": 3.180925793676199e-05,
"loss": 0.375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4228053689002991,
"step": 1595,
"valid_targets_mean": 2364.7,
"valid_targets_min": 985
},
{
"epoch": 2.593192868719611,
"grad_norm": 0.6385223754745202,
"learning_rate": 3.1743932234386905e-05,
"loss": 0.3582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33268439769744873,
"step": 1600,
"valid_targets_mean": 3510.6,
"valid_targets_min": 1022
},
{
"epoch": 2.6012965964343597,
"grad_norm": 0.6203925952713126,
"learning_rate": 3.167841474304555e-05,
"loss": 0.3524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35235142707824707,
"step": 1605,
"valid_targets_mean": 4186.2,
"valid_targets_min": 1441
},
{
"epoch": 2.6094003241491084,
"grad_norm": 0.6407113023621984,
"learning_rate": 3.161270653269743e-05,
"loss": 0.363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37132495641708374,
"step": 1610,
"valid_targets_mean": 3792.4,
"valid_targets_min": 1169
},
{
"epoch": 2.6175040518638575,
"grad_norm": 0.787376412545527,
"learning_rate": 3.154680867641666e-05,
"loss": 0.3786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3557274639606476,
"step": 1615,
"valid_targets_mean": 2341.8,
"valid_targets_min": 874
},
{
"epoch": 2.625607779578606,
"grad_norm": 0.7020441242654781,
"learning_rate": 3.1480722250374454e-05,
"loss": 0.3702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3731013536453247,
"step": 1620,
"valid_targets_mean": 3057.1,
"valid_targets_min": 1061
},
{
"epoch": 2.633711507293355,
"grad_norm": 0.6408600597666677,
"learning_rate": 3.1414448333821526e-05,
"loss": 0.3524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3454047441482544,
"step": 1625,
"valid_targets_mean": 3993.4,
"valid_targets_min": 1023
},
{
"epoch": 2.641815235008104,
"grad_norm": 0.4902024972171765,
"learning_rate": 3.1347988009070496e-05,
"loss": 0.3596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34175369143486023,
"step": 1630,
"valid_targets_mean": 6449.6,
"valid_targets_min": 1164
},
{
"epoch": 2.6499189627228525,
"grad_norm": 0.6120518005314733,
"learning_rate": 3.1281342361478184e-05,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40884333848953247,
"step": 1635,
"valid_targets_mean": 4059.9,
"valid_targets_min": 979
},
{
"epoch": 2.658022690437601,
"grad_norm": 0.6771620012648307,
"learning_rate": 3.121451247942789e-05,
"loss": 0.3555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38433632254600525,
"step": 1640,
"valid_targets_mean": 4274.3,
"valid_targets_min": 856
},
{
"epoch": 2.6661264181523503,
"grad_norm": 0.5457628190492216,
"learning_rate": 3.1147499454311654e-05,
"loss": 0.4067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3678765892982483,
"step": 1645,
"valid_targets_mean": 5149.6,
"valid_targets_min": 1689
},
{
"epoch": 2.674230145867099,
"grad_norm": 0.627604755543937,
"learning_rate": 3.1080304380512386e-05,
"loss": 0.3641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4083409309387207,
"step": 1650,
"valid_targets_mean": 4076.5,
"valid_targets_min": 1109
},
{
"epoch": 2.6823338735818476,
"grad_norm": 1.1030374170315973,
"learning_rate": 3.101292835538602e-05,
"loss": 0.3886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4205278158187866,
"step": 1655,
"valid_targets_mean": 2480.2,
"valid_targets_min": 1100
},
{
"epoch": 2.6904376012965967,
"grad_norm": 0.7339764425274315,
"learning_rate": 3.0945372479243605e-05,
"loss": 0.3464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35320383310317993,
"step": 1660,
"valid_targets_mean": 2801.6,
"valid_targets_min": 1023
},
{
"epoch": 2.6985413290113454,
"grad_norm": 0.6863535808248586,
"learning_rate": 3.087763785533328e-05,
"loss": 0.3789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4404126703739166,
"step": 1665,
"valid_targets_mean": 3782.9,
"valid_targets_min": 1136
},
{
"epoch": 2.706645056726094,
"grad_norm": 0.7168705430931214,
"learning_rate": 3.0809725589822325e-05,
"loss": 0.3784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3114071190357208,
"step": 1670,
"valid_targets_mean": 2838.5,
"valid_targets_min": 1215
},
{
"epoch": 2.7147487844408427,
"grad_norm": 0.6556363386210516,
"learning_rate": 3.074163679177907e-05,
"loss": 0.3592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36680227518081665,
"step": 1675,
"valid_targets_mean": 3425.0,
"valid_targets_min": 1262
},
{
"epoch": 2.7228525121555913,
"grad_norm": 0.7037719475710038,
"learning_rate": 3.067337257315477e-05,
"loss": 0.4053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3956286311149597,
"step": 1680,
"valid_targets_mean": 3108.4,
"valid_targets_min": 1175
},
{
"epoch": 2.7309562398703404,
"grad_norm": 0.5316241938449401,
"learning_rate": 3.0604934048765444e-05,
"loss": 0.3245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28850430250167847,
"step": 1685,
"valid_targets_mean": 4587.1,
"valid_targets_min": 1823
},
{
"epoch": 2.739059967585089,
"grad_norm": 0.7055812576851976,
"learning_rate": 3.05363223362737e-05,
"loss": 0.3812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38997015357017517,
"step": 1690,
"valid_targets_mean": 3222.5,
"valid_targets_min": 1028
},
{
"epoch": 2.7471636952998377,
"grad_norm": 0.664731751727158,
"learning_rate": 3.0467538556170463e-05,
"loss": 0.36,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32559171319007874,
"step": 1695,
"valid_targets_mean": 2939.7,
"valid_targets_min": 765
},
{
"epoch": 2.755267423014587,
"grad_norm": 0.5783986029196682,
"learning_rate": 3.0398583831756655e-05,
"loss": 0.3368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3600800633430481,
"step": 1700,
"valid_targets_mean": 4368.5,
"valid_targets_min": 1327
},
{
"epoch": 2.7633711507293355,
"grad_norm": 0.611412124205423,
"learning_rate": 3.03294592891249e-05,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33210447430610657,
"step": 1705,
"valid_targets_mean": 4879.0,
"valid_targets_min": 1231
},
{
"epoch": 2.771474878444084,
"grad_norm": 0.557474285200355,
"learning_rate": 3.0260166057141086e-05,
"loss": 0.3625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32921281456947327,
"step": 1710,
"valid_targets_mean": 4460.2,
"valid_targets_min": 1413
},
{
"epoch": 2.7795786061588332,
"grad_norm": 0.5043150540097012,
"learning_rate": 3.0190705267425956e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2847195863723755,
"step": 1715,
"valid_targets_mean": 4976.2,
"valid_targets_min": 1237
},
{
"epoch": 2.787682333873582,
"grad_norm": 0.5706697755674613,
"learning_rate": 3.0121078054336633e-05,
"loss": 0.3416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3246619701385498,
"step": 1720,
"valid_targets_mean": 4126.2,
"valid_targets_min": 1436
},
{
"epoch": 2.7957860615883305,
"grad_norm": 0.6778117045066955,
"learning_rate": 3.005128555494806e-05,
"loss": 0.3771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36269962787628174,
"step": 1725,
"valid_targets_mean": 3297.2,
"valid_targets_min": 1201
},
{
"epoch": 2.8038897893030796,
"grad_norm": 0.5794849455469647,
"learning_rate": 2.998132890903448e-05,
"loss": 0.3473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.330091655254364,
"step": 1730,
"valid_targets_mean": 3850.0,
"valid_targets_min": 1070
},
{
"epoch": 2.8119935170178283,
"grad_norm": 0.6007475248043017,
"learning_rate": 2.9911209259050763e-05,
"loss": 0.354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35253655910491943,
"step": 1735,
"valid_targets_mean": 4133.7,
"valid_targets_min": 1510
},
{
"epoch": 2.820097244732577,
"grad_norm": 0.5841323161644045,
"learning_rate": 2.984092775011382e-05,
"loss": 0.356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3201521635055542,
"step": 1740,
"valid_targets_mean": 4134.8,
"valid_targets_min": 1065
},
{
"epoch": 2.828200972447326,
"grad_norm": 0.7336317690567647,
"learning_rate": 2.9770485529983834e-05,
"loss": 0.3741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44161343574523926,
"step": 1745,
"valid_targets_mean": 2970.2,
"valid_targets_min": 991
},
{
"epoch": 2.8363047001620747,
"grad_norm": 0.6635532459963542,
"learning_rate": 2.9699883749045564e-05,
"loss": 0.3355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3493614196777344,
"step": 1750,
"valid_targets_mean": 3285.0,
"valid_targets_min": 626
},
{
"epoch": 2.8444084278768234,
"grad_norm": 0.5027187622458136,
"learning_rate": 2.962912356028953e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3354187309741974,
"step": 1755,
"valid_targets_mean": 4720.4,
"valid_targets_min": 1170
},
{
"epoch": 2.852512155591572,
"grad_norm": 0.6901547177308334,
"learning_rate": 2.95582061192932e-05,
"loss": 0.3491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3903937339782715,
"step": 1760,
"valid_targets_mean": 3206.8,
"valid_targets_min": 1276
},
{
"epoch": 2.8606158833063207,
"grad_norm": 0.5708803489808794,
"learning_rate": 2.9487132584202115e-05,
"loss": 0.3831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3380119800567627,
"step": 1765,
"valid_targets_mean": 3977.0,
"valid_targets_min": 1095
},
{
"epoch": 2.8687196110210698,
"grad_norm": 0.5085623418043083,
"learning_rate": 2.9415904115710964e-05,
"loss": 0.3575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34908628463745117,
"step": 1770,
"valid_targets_mean": 4955.4,
"valid_targets_min": 1178
},
{
"epoch": 2.8768233387358184,
"grad_norm": 0.6051208343777774,
"learning_rate": 2.9344521877044633e-05,
"loss": 0.3787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4075632691383362,
"step": 1775,
"valid_targets_mean": 4224.0,
"valid_targets_min": 349
},
{
"epoch": 2.884927066450567,
"grad_norm": 0.5855062840025109,
"learning_rate": 2.927298703393924e-05,
"loss": 0.3579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3283981680870056,
"step": 1780,
"valid_targets_mean": 4081.2,
"valid_targets_min": 959
},
{
"epoch": 2.893030794165316,
"grad_norm": 0.6371935770846757,
"learning_rate": 2.9201300754623046e-05,
"loss": 0.3729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3392450511455536,
"step": 1785,
"valid_targets_mean": 3568.0,
"valid_targets_min": 1160
},
{
"epoch": 2.901134521880065,
"grad_norm": 0.4278974307253599,
"learning_rate": 2.9129464209797404e-05,
"loss": 0.3376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2865206003189087,
"step": 1790,
"valid_targets_mean": 6328.2,
"valid_targets_min": 1058
},
{
"epoch": 2.9092382495948135,
"grad_norm": 0.5505126981477363,
"learning_rate": 2.9057478572617644e-05,
"loss": 0.3201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.337314248085022,
"step": 1795,
"valid_targets_mean": 4826.6,
"valid_targets_min": 1736
},
{
"epoch": 2.9173419773095626,
"grad_norm": 0.7805624719946108,
"learning_rate": 2.898534501867391e-05,
"loss": 0.376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4011368751525879,
"step": 1800,
"valid_targets_mean": 2397.6,
"valid_targets_min": 898
},
{
"epoch": 2.9254457050243112,
"grad_norm": 0.5482087600129742,
"learning_rate": 2.8913064725971947e-05,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3068529963493347,
"step": 1805,
"valid_targets_mean": 5494.9,
"valid_targets_min": 1006
},
{
"epoch": 2.93354943273906,
"grad_norm": 0.9936321479400723,
"learning_rate": 2.8840638874913894e-05,
"loss": 0.3868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40905821323394775,
"step": 1810,
"valid_targets_mean": 3718.8,
"valid_targets_min": 1419
},
{
"epoch": 2.941653160453809,
"grad_norm": 0.5736879552202689,
"learning_rate": 2.8768068648278976e-05,
"loss": 0.3454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39087069034576416,
"step": 1815,
"valid_targets_mean": 4475.4,
"valid_targets_min": 1388
},
{
"epoch": 2.9497568881685576,
"grad_norm": 0.6756877628799013,
"learning_rate": 2.8695355231204206e-05,
"loss": 0.3601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3940260112285614,
"step": 1820,
"valid_targets_mean": 3155.6,
"valid_targets_min": 463
},
{
"epoch": 2.9578606158833063,
"grad_norm": 0.5794570379139724,
"learning_rate": 2.862249981116502e-05,
"loss": 0.3382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3015279173851013,
"step": 1825,
"valid_targets_mean": 4283.2,
"valid_targets_min": 1192
},
{
"epoch": 2.965964343598055,
"grad_norm": 0.6037397342964902,
"learning_rate": 2.854950357795589e-05,
"loss": 0.3597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3510607182979584,
"step": 1830,
"valid_targets_mean": 3907.7,
"valid_targets_min": 1421
},
{
"epoch": 2.974068071312804,
"grad_norm": 0.6184387967781734,
"learning_rate": 2.847636772367091e-05,
"loss": 0.3505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3586122989654541,
"step": 1835,
"valid_targets_mean": 3820.1,
"valid_targets_min": 1575
},
{
"epoch": 2.9821717990275527,
"grad_norm": 0.6530052932759616,
"learning_rate": 2.8403093442684287e-05,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4493202865123749,
"step": 1840,
"valid_targets_mean": 3684.6,
"valid_targets_min": 1219
},
{
"epoch": 2.9902755267423013,
"grad_norm": 0.5322411565499487,
"learning_rate": 2.8329681931630877e-05,
"loss": 0.3515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34222137928009033,
"step": 1845,
"valid_targets_mean": 4850.8,
"valid_targets_min": 1409
},
{
"epoch": 2.99837925445705,
"grad_norm": 0.5810539949314576,
"learning_rate": 2.825613438938663e-05,
"loss": 0.3602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3474220931529999,
"step": 1850,
"valid_targets_mean": 4159.3,
"valid_targets_min": 1442
},
{
"epoch": 3.006482982171799,
"grad_norm": 0.5876530626626576,
"learning_rate": 2.8182452017048983e-05,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3032858371734619,
"step": 1855,
"valid_targets_mean": 3758.8,
"valid_targets_min": 1413
},
{
"epoch": 3.0145867098865478,
"grad_norm": 0.6532906368770814,
"learning_rate": 2.81086360179173e-05,
"loss": 0.3592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3261423707008362,
"step": 1860,
"valid_targets_mean": 3757.5,
"valid_targets_min": 1124
},
{
"epoch": 3.0226904376012964,
"grad_norm": 0.6768457925442797,
"learning_rate": 2.8034687597473164e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33774706721305847,
"step": 1865,
"valid_targets_mean": 3208.4,
"valid_targets_min": 1392
},
{
"epoch": 3.0307941653160455,
"grad_norm": 0.6026553451116088,
"learning_rate": 2.796060796336074e-05,
"loss": 0.3436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3198626637458801,
"step": 1870,
"valid_targets_mean": 4000.1,
"valid_targets_min": 1044
},
{
"epoch": 3.038897893030794,
"grad_norm": 0.6424620557357676,
"learning_rate": 2.7886398325367018e-05,
"loss": 0.3378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2810208797454834,
"step": 1875,
"valid_targets_mean": 3380.9,
"valid_targets_min": 759
},
{
"epoch": 3.047001620745543,
"grad_norm": 0.653905616156312,
"learning_rate": 2.7812059895402064e-05,
"loss": 0.3081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29623761773109436,
"step": 1880,
"valid_targets_mean": 3166.4,
"valid_targets_min": 1436
},
{
"epoch": 3.055105348460292,
"grad_norm": 0.6290299885338436,
"learning_rate": 2.773759388747925e-05,
"loss": 0.3417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2997327446937561,
"step": 1885,
"valid_targets_mean": 4197.2,
"valid_targets_min": 1205
},
{
"epoch": 3.0632090761750406,
"grad_norm": 0.6799966773570919,
"learning_rate": 2.7663001517695386e-05,
"loss": 0.295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31888049840927124,
"step": 1890,
"valid_targets_mean": 3355.9,
"valid_targets_min": 765
},
{
"epoch": 3.0713128038897892,
"grad_norm": 0.6150196310708935,
"learning_rate": 2.7588284004210907e-05,
"loss": 0.3195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2811214327812195,
"step": 1895,
"valid_targets_mean": 4364.9,
"valid_targets_min": 1049
},
{
"epoch": 3.079416531604538,
"grad_norm": 0.6290637964866943,
"learning_rate": 2.7513442567229936e-05,
"loss": 0.3593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3333356976509094,
"step": 1900,
"valid_targets_mean": 4037.9,
"valid_targets_min": 1237
},
{
"epoch": 3.087520259319287,
"grad_norm": 0.6693041785931817,
"learning_rate": 2.7438478428980407e-05,
"loss": 0.3229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3725960850715637,
"step": 1905,
"valid_targets_mean": 5818.6,
"valid_targets_min": 961
},
{
"epoch": 3.0956239870340356,
"grad_norm": 0.7196188613672898,
"learning_rate": 2.7363392813694047e-05,
"loss": 0.3148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31832918524742126,
"step": 1910,
"valid_targets_mean": 3378.1,
"valid_targets_min": 1281
},
{
"epoch": 3.1037277147487843,
"grad_norm": 0.5818347922259423,
"learning_rate": 2.7288186947586426e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3344227075576782,
"step": 1915,
"valid_targets_mean": 4411.8,
"valid_targets_min": 1216
},
{
"epoch": 3.1118314424635334,
"grad_norm": 0.8446124163677976,
"learning_rate": 2.7212862058836925e-05,
"loss": 0.3213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33817988634109497,
"step": 1920,
"valid_targets_mean": 2214.9,
"valid_targets_min": 975
},
{
"epoch": 3.119935170178282,
"grad_norm": 0.5779953469992928,
"learning_rate": 2.713741937756865e-05,
"loss": 0.3159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.341831237077713,
"step": 1925,
"valid_targets_mean": 4742.4,
"valid_targets_min": 1109
},
{
"epoch": 3.1280388978930307,
"grad_norm": 0.6294273422868075,
"learning_rate": 2.7061860135828384e-05,
"loss": 0.3238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27781611680984497,
"step": 1930,
"valid_targets_mean": 3733.9,
"valid_targets_min": 943
},
{
"epoch": 3.1361426256077793,
"grad_norm": 0.6062050863467073,
"learning_rate": 2.6986185567566442e-05,
"loss": 0.3311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3080408573150635,
"step": 1935,
"valid_targets_mean": 4087.9,
"valid_targets_min": 906
},
{
"epoch": 3.1442463533225284,
"grad_norm": 0.6952279897706104,
"learning_rate": 2.6910396908616527e-05,
"loss": 0.3299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3233116567134857,
"step": 1940,
"valid_targets_mean": 2762.6,
"valid_targets_min": 1176
},
{
"epoch": 3.152350081037277,
"grad_norm": 0.6787695116443276,
"learning_rate": 2.6834495396675526e-05,
"loss": 0.3359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3256149888038635,
"step": 1945,
"valid_targets_mean": 3157.2,
"valid_targets_min": 1514
},
{
"epoch": 3.1604538087520258,
"grad_norm": 1.1495419111797855,
"learning_rate": 2.6758482271283347e-05,
"loss": 0.354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3622073531150818,
"step": 1950,
"valid_targets_mean": 4490.8,
"valid_targets_min": 989
},
{
"epoch": 3.168557536466775,
"grad_norm": 0.5168346141282057,
"learning_rate": 2.668235877380263e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26513683795928955,
"step": 1955,
"valid_targets_mean": 4616.9,
"valid_targets_min": 1226
},
{
"epoch": 3.1766612641815235,
"grad_norm": 0.5043452872043703,
"learning_rate": 2.660612614739849e-05,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28028619289398193,
"step": 1960,
"valid_targets_mean": 5325.6,
"valid_targets_min": 1168
},
{
"epoch": 3.184764991896272,
"grad_norm": 0.6906179138947607,
"learning_rate": 2.652978563701822e-05,
"loss": 0.3754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3693622946739197,
"step": 1965,
"valid_targets_mean": 3594.6,
"valid_targets_min": 796
},
{
"epoch": 3.1928687196110213,
"grad_norm": 0.49400430685078656,
"learning_rate": 2.645333848937095e-05,
"loss": 0.3227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28254038095474243,
"step": 1970,
"valid_targets_mean": 6402.3,
"valid_targets_min": 942
},
{
"epoch": 3.20097244732577,
"grad_norm": 0.637834024266905,
"learning_rate": 2.6376785952907292e-05,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2891494035720825,
"step": 1975,
"valid_targets_mean": 3953.7,
"valid_targets_min": 1532
},
{
"epoch": 3.2090761750405186,
"grad_norm": 0.7558584709666064,
"learning_rate": 2.630012927779896e-05,
"loss": 0.3222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3705684542655945,
"step": 1980,
"valid_targets_mean": 3169.7,
"valid_targets_min": 1009
},
{
"epoch": 3.217179902755267,
"grad_norm": 0.7032258231926862,
"learning_rate": 2.6223369715918338e-05,
"loss": 0.3329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3272814154624939,
"step": 1985,
"valid_targets_mean": 3970.0,
"valid_targets_min": 891
},
{
"epoch": 3.2252836304700163,
"grad_norm": 0.5503263411221311,
"learning_rate": 2.614650852081805e-05,
"loss": 0.3136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31049543619155884,
"step": 1990,
"valid_targets_mean": 4652.0,
"valid_targets_min": 1039
},
{
"epoch": 3.233387358184765,
"grad_norm": 0.6450482534708121,
"learning_rate": 2.606954694771047e-05,
"loss": 0.3312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3217643201351166,
"step": 1995,
"valid_targets_mean": 4368.6,
"valid_targets_min": 1147
},
{
"epoch": 3.2414910858995136,
"grad_norm": 0.6920112935131606,
"learning_rate": 2.5992486253447258e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3920653462409973,
"step": 2000,
"valid_targets_mean": 3602.1,
"valid_targets_min": 1061
},
{
"epoch": 3.2495948136142627,
"grad_norm": 0.5584795903285783,
"learning_rate": 2.5915327696498787e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3155994415283203,
"step": 2005,
"valid_targets_mean": 4913.4,
"valid_targets_min": 858
},
{
"epoch": 3.2576985413290114,
"grad_norm": 0.60509966416426,
"learning_rate": 2.583807253693362e-05,
"loss": 0.3474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28235840797424316,
"step": 2010,
"valid_targets_mean": 4147.4,
"valid_targets_min": 1456
},
{
"epoch": 3.26580226904376,
"grad_norm": 0.6062613453180128,
"learning_rate": 2.576072203639794e-05,
"loss": 0.343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3725880980491638,
"step": 2015,
"valid_targets_mean": 4285.9,
"valid_targets_min": 1194
},
{
"epoch": 3.2739059967585087,
"grad_norm": 0.5738457995722336,
"learning_rate": 2.5683277458094926e-05,
"loss": 0.3144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3272360563278198,
"step": 2020,
"valid_targets_mean": 4682.2,
"valid_targets_min": 1157
},
{
"epoch": 3.282009724473258,
"grad_norm": 0.8579473802204056,
"learning_rate": 2.560574006676413e-05,
"loss": 0.3313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3547009229660034,
"step": 2025,
"valid_targets_mean": 2234.7,
"valid_targets_min": 1192
},
{
"epoch": 3.2901134521880064,
"grad_norm": 0.6933220501836592,
"learning_rate": 2.5528111128660826e-05,
"loss": 0.3368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33494657278060913,
"step": 2030,
"valid_targets_mean": 3647.6,
"valid_targets_min": 1160
},
{
"epoch": 3.298217179902755,
"grad_norm": 0.7250423855085911,
"learning_rate": 2.545039191153533e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30072858929634094,
"step": 2035,
"valid_targets_mean": 2830.2,
"valid_targets_min": 752
},
{
"epoch": 3.306320907617504,
"grad_norm": 0.5630006709655807,
"learning_rate": 2.53725836846123e-05,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2971174716949463,
"step": 2040,
"valid_targets_mean": 4642.2,
"valid_targets_min": 1261
},
{
"epoch": 3.314424635332253,
"grad_norm": 0.6837754571304738,
"learning_rate": 2.5294687718569994e-05,
"loss": 0.3488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29883715510368347,
"step": 2045,
"valid_targets_mean": 3184.2,
"valid_targets_min": 1064
},
{
"epoch": 3.3225283630470015,
"grad_norm": 0.6214125630303267,
"learning_rate": 2.5216705285519525e-05,
"loss": 0.3056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.303884357213974,
"step": 2050,
"valid_targets_mean": 4170.8,
"valid_targets_min": 1264
},
{
"epoch": 3.3306320907617506,
"grad_norm": 0.7065926173313246,
"learning_rate": 2.5138637658984116e-05,
"loss": 0.3617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4543423056602478,
"step": 2055,
"valid_targets_mean": 4195.6,
"valid_targets_min": 1023
},
{
"epoch": 3.3387358184764993,
"grad_norm": 0.7035147409734731,
"learning_rate": 2.5060486113878244e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3000071942806244,
"step": 2060,
"valid_targets_mean": 3148.4,
"valid_targets_min": 1195
},
{
"epoch": 3.346839546191248,
"grad_norm": 0.5664150065637116,
"learning_rate": 2.4982251926486873e-05,
"loss": 0.3111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2577757239341736,
"step": 2065,
"valid_targets_mean": 3929.9,
"valid_targets_min": 1442
},
{
"epoch": 3.354943273905997,
"grad_norm": 0.6440217382239727,
"learning_rate": 2.490393637444458e-05,
"loss": 0.3241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3098256587982178,
"step": 2070,
"valid_targets_mean": 3736.5,
"valid_targets_min": 1467
},
{
"epoch": 3.3630470016207457,
"grad_norm": 0.601624816332684,
"learning_rate": 2.482554073671471e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29705819487571716,
"step": 2075,
"valid_targets_mean": 3976.4,
"valid_targets_min": 1256
},
{
"epoch": 3.3711507293354943,
"grad_norm": 0.6332684428153963,
"learning_rate": 2.4747066293568452e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34846431016921997,
"step": 2080,
"valid_targets_mean": 3731.8,
"valid_targets_min": 1267
},
{
"epoch": 3.379254457050243,
"grad_norm": 0.622824711033024,
"learning_rate": 2.4668514326564e-05,
"loss": 0.3304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3172885775566101,
"step": 2085,
"valid_targets_mean": 4841.5,
"valid_targets_min": 1281
},
{
"epoch": 3.387358184764992,
"grad_norm": 0.5756571432151757,
"learning_rate": 2.4589886118525556e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28297609090805054,
"step": 2090,
"valid_targets_mean": 4441.5,
"valid_targets_min": 1041
},
{
"epoch": 3.3954619124797407,
"grad_norm": 0.6063759657293902,
"learning_rate": 2.4511182953522405e-05,
"loss": 0.3615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3448454737663269,
"step": 2095,
"valid_targets_mean": 4130.9,
"valid_targets_min": 1434
},
{
"epoch": 3.4035656401944894,
"grad_norm": 0.6837849754358483,
"learning_rate": 2.4432406116847954e-05,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4419548809528351,
"step": 2100,
"valid_targets_mean": 3970.8,
"valid_targets_min": 710
},
{
"epoch": 3.411669367909238,
"grad_norm": 0.7285501548199385,
"learning_rate": 2.435355689499874e-05,
"loss": 0.3489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3801971971988678,
"step": 2105,
"valid_targets_mean": 3257.1,
"valid_targets_min": 818
},
{
"epoch": 3.419773095623987,
"grad_norm": 0.6734064818131312,
"learning_rate": 2.4274636575653398e-05,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3767085075378418,
"step": 2110,
"valid_targets_mean": 4296.2,
"valid_targets_min": 1145
},
{
"epoch": 3.427876823338736,
"grad_norm": 0.4899912083889619,
"learning_rate": 2.4195646447651663e-05,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2573740482330322,
"step": 2115,
"valid_targets_mean": 5421.6,
"valid_targets_min": 1276
},
{
"epoch": 3.4359805510534844,
"grad_norm": 0.8302010528432883,
"learning_rate": 2.411658780097331e-05,
"loss": 0.3315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3501180410385132,
"step": 2120,
"valid_targets_mean": 5060.1,
"valid_targets_min": 1026
},
{
"epoch": 3.4440842787682335,
"grad_norm": 0.8078858491515395,
"learning_rate": 2.4037461926717075e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3591434955596924,
"step": 2125,
"valid_targets_mean": 2513.8,
"valid_targets_min": 1204
},
{
"epoch": 3.452188006482982,
"grad_norm": 0.7684258628541496,
"learning_rate": 2.395827011707959e-05,
"loss": 0.3193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30334824323654175,
"step": 2130,
"valid_targets_mean": 3054.1,
"valid_targets_min": 1884
},
{
"epoch": 3.460291734197731,
"grad_norm": 0.605594191987749,
"learning_rate": 2.3879013665334258e-05,
"loss": 0.3272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2900565564632416,
"step": 2135,
"valid_targets_mean": 4041.1,
"valid_targets_min": 1271
},
{
"epoch": 3.46839546191248,
"grad_norm": 0.8309685861439673,
"learning_rate": 2.3799693865810163e-05,
"loss": 0.3481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37296062707901,
"step": 2140,
"valid_targets_mean": 4586.9,
"valid_targets_min": 1363
},
{
"epoch": 3.4764991896272286,
"grad_norm": 0.6551158353626602,
"learning_rate": 2.37203120138709e-05,
"loss": 0.3182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29635459184646606,
"step": 2145,
"valid_targets_mean": 3419.6,
"valid_targets_min": 905
},
{
"epoch": 3.4846029173419772,
"grad_norm": 0.6087540304186911,
"learning_rate": 2.3640869405893446e-05,
"loss": 0.3493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3888489603996277,
"step": 2150,
"valid_targets_mean": 4710.4,
"valid_targets_min": 1216
},
{
"epoch": 3.492706645056726,
"grad_norm": 0.6512082633788822,
"learning_rate": 2.3561367339246976e-05,
"loss": 0.354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33419734239578247,
"step": 2155,
"valid_targets_mean": 4247.2,
"valid_targets_min": 1205
},
{
"epoch": 3.500810372771475,
"grad_norm": 0.6006332493640769,
"learning_rate": 2.3481807112271678e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28265705704689026,
"step": 2160,
"valid_targets_mean": 4532.8,
"valid_targets_min": 1355
},
{
"epoch": 3.5089141004862237,
"grad_norm": 0.6341470250528332,
"learning_rate": 2.3402190024257543e-05,
"loss": 0.3251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3464913070201874,
"step": 2165,
"valid_targets_mean": 3982.2,
"valid_targets_min": 1030
},
{
"epoch": 3.5170178282009723,
"grad_norm": 0.49166553268855945,
"learning_rate": 2.3322517375423165e-05,
"loss": 0.3251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3147142827510834,
"step": 2170,
"valid_targets_mean": 5943.0,
"valid_targets_min": 1166
},
{
"epoch": 3.525121555915721,
"grad_norm": 0.6416235508438507,
"learning_rate": 2.3242790466894494e-05,
"loss": 0.3379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3126268684864044,
"step": 2175,
"valid_targets_mean": 3601.8,
"valid_targets_min": 964
},
{
"epoch": 3.53322528363047,
"grad_norm": 0.7830076468989171,
"learning_rate": 2.316301060068359e-05,
"loss": 0.3423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30202680826187134,
"step": 2180,
"valid_targets_mean": 4094.8,
"valid_targets_min": 1174
},
{
"epoch": 3.5413290113452187,
"grad_norm": 0.5855369398506851,
"learning_rate": 2.3083179079667347e-05,
"loss": 0.3314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29343757033348083,
"step": 2185,
"valid_targets_mean": 4782.4,
"valid_targets_min": 1087
},
{
"epoch": 3.5494327390599674,
"grad_norm": 0.7597815442570822,
"learning_rate": 2.300329720756625e-05,
"loss": 0.3539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3538168966770172,
"step": 2190,
"valid_targets_mean": 2795.9,
"valid_targets_min": 987
},
{
"epoch": 3.5575364667747165,
"grad_norm": 0.6412366872198969,
"learning_rate": 2.2923366288923045e-05,
"loss": 0.3495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34232521057128906,
"step": 2195,
"valid_targets_mean": 3828.8,
"valid_targets_min": 1162
},
{
"epoch": 3.565640194489465,
"grad_norm": 0.8572308035882495,
"learning_rate": 2.2843387629081453e-05,
"loss": 0.3201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34046727418899536,
"step": 2200,
"valid_targets_mean": 2780.4,
"valid_targets_min": 1118
},
{
"epoch": 3.5737439222042138,
"grad_norm": 0.8499753167098539,
"learning_rate": 2.2763362534164854e-05,
"loss": 0.3543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33723342418670654,
"step": 2205,
"valid_targets_mean": 4185.2,
"valid_targets_min": 1169
},
{
"epoch": 3.581847649918963,
"grad_norm": 0.6092208444164786,
"learning_rate": 2.268329231105498e-05,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3268812596797943,
"step": 2210,
"valid_targets_mean": 4369.1,
"valid_targets_min": 1360
},
{
"epoch": 3.5899513776337115,
"grad_norm": 0.6149682556778238,
"learning_rate": 2.2603178267370504e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2967323958873749,
"step": 2215,
"valid_targets_mean": 3937.6,
"valid_targets_min": 974
},
{
"epoch": 3.59805510534846,
"grad_norm": 0.6136305917408219,
"learning_rate": 2.2523021711445746e-05,
"loss": 0.3271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32520681619644165,
"step": 2220,
"valid_targets_mean": 4224.8,
"valid_targets_min": 955
},
{
"epoch": 3.6061588330632093,
"grad_norm": 0.7678255502273676,
"learning_rate": 2.2442823952309308e-05,
"loss": 0.3278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37268686294555664,
"step": 2225,
"valid_targets_mean": 2761.6,
"valid_targets_min": 823
},
{
"epoch": 3.614262560777958,
"grad_norm": 0.6825494201612562,
"learning_rate": 2.2362586299662642e-05,
"loss": 0.3154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30497026443481445,
"step": 2230,
"valid_targets_mean": 3246.8,
"valid_targets_min": 1196
},
{
"epoch": 3.6223662884927066,
"grad_norm": 0.7635839021679189,
"learning_rate": 2.228231006385873e-05,
"loss": 0.3218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30430150032043457,
"step": 2235,
"valid_targets_mean": 3143.2,
"valid_targets_min": 1208
},
{
"epoch": 3.6304700162074557,
"grad_norm": 0.7017950535136555,
"learning_rate": 2.2201996555880633e-05,
"loss": 0.327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31477123498916626,
"step": 2240,
"valid_targets_mean": 3130.1,
"valid_targets_min": 1155
},
{
"epoch": 3.6385737439222043,
"grad_norm": 0.6932946086334288,
"learning_rate": 2.2121647087320105e-05,
"loss": 0.3548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31043219566345215,
"step": 2245,
"valid_targets_mean": 3812.2,
"valid_targets_min": 1364
},
{
"epoch": 3.646677471636953,
"grad_norm": 0.7548489669502686,
"learning_rate": 2.204126297035617e-05,
"loss": 0.3342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33928608894348145,
"step": 2250,
"valid_targets_mean": 3369.1,
"valid_targets_min": 1178
},
{
"epoch": 3.6547811993517016,
"grad_norm": 0.8476792319211851,
"learning_rate": 2.196084551773368e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.299949049949646,
"step": 2255,
"valid_targets_mean": 3624.9,
"valid_targets_min": 828
},
{
"epoch": 3.6628849270664503,
"grad_norm": 0.7748299471252531,
"learning_rate": 2.1880396042741906e-05,
"loss": 0.3251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34626305103302,
"step": 2260,
"valid_targets_mean": 3092.2,
"valid_targets_min": 1019
},
{
"epoch": 3.6709886547811994,
"grad_norm": 0.6871604467560325,
"learning_rate": 2.179991585919307e-05,
"loss": 0.3481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.348859965801239,
"step": 2265,
"valid_targets_mean": 3594.6,
"valid_targets_min": 1166
},
{
"epoch": 3.679092382495948,
"grad_norm": 0.5432953919737468,
"learning_rate": 2.1719406281400873e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26746731996536255,
"step": 2270,
"valid_targets_mean": 4830.1,
"valid_targets_min": 1507
},
{
"epoch": 3.6871961102106967,
"grad_norm": 0.5290458938160579,
"learning_rate": 2.163886862415908e-05,
"loss": 0.3227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29459887742996216,
"step": 2275,
"valid_targets_mean": 5012.5,
"valid_targets_min": 1011
},
{
"epoch": 3.695299837925446,
"grad_norm": 0.7557537719911694,
"learning_rate": 2.155830420272e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3687734007835388,
"step": 2280,
"valid_targets_mean": 3272.9,
"valid_targets_min": 971
},
{
"epoch": 3.7034035656401945,
"grad_norm": 0.6329174750743987,
"learning_rate": 2.1477714332773022e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31322354078292847,
"step": 2285,
"valid_targets_mean": 4787.0,
"valid_targets_min": 1369
},
{
"epoch": 3.711507293354943,
"grad_norm": 0.6980753042204155,
"learning_rate": 2.139710033042314e-05,
"loss": 0.3132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3370036482810974,
"step": 2290,
"valid_targets_mean": 3192.8,
"valid_targets_min": 1708
},
{
"epoch": 3.719611021069692,
"grad_norm": 0.5353150533110514,
"learning_rate": 2.1316463512169453e-05,
"loss": 0.329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2963425815105438,
"step": 2295,
"valid_targets_mean": 5346.8,
"valid_targets_min": 1110
},
{
"epoch": 3.727714748784441,
"grad_norm": 0.727354106763134,
"learning_rate": 2.1235805194883665e-05,
"loss": 0.319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3349874019622803,
"step": 2300,
"valid_targets_mean": 3280.2,
"valid_targets_min": 1314
},
{
"epoch": 3.7358184764991895,
"grad_norm": 0.5340590099482381,
"learning_rate": 2.115512669578857e-05,
"loss": 0.3387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3433595299720764,
"step": 2305,
"valid_targets_mean": 5857.9,
"valid_targets_min": 1335
},
{
"epoch": 3.7439222042139386,
"grad_norm": 0.6620119615821005,
"learning_rate": 2.107442933243656e-05,
"loss": 0.3099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3657473623752594,
"step": 2310,
"valid_targets_mean": 3610.8,
"valid_targets_min": 1152
},
{
"epoch": 3.7520259319286873,
"grad_norm": 0.7166286016202882,
"learning_rate": 2.099371442268809e-05,
"loss": 0.3495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3325074017047882,
"step": 2315,
"valid_targets_mean": 3517.5,
"valid_targets_min": 1038
},
{
"epoch": 3.760129659643436,
"grad_norm": 0.4555518809686943,
"learning_rate": 2.0912983284690157e-05,
"loss": 0.314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2193748652935028,
"step": 2320,
"valid_targets_mean": 5561.4,
"valid_targets_min": 1239
},
{
"epoch": 3.768233387358185,
"grad_norm": 0.8753777799659089,
"learning_rate": 2.0832237236854794e-05,
"loss": 0.3557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3095594644546509,
"step": 2325,
"valid_targets_mean": 3388.4,
"valid_targets_min": 1001
},
{
"epoch": 3.7763371150729337,
"grad_norm": 0.6884922798779087,
"learning_rate": 2.0751477597837528e-05,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.335110604763031,
"step": 2330,
"valid_targets_mean": 3354.2,
"valid_targets_min": 1386
},
{
"epoch": 3.7844408427876823,
"grad_norm": 0.6332533539670777,
"learning_rate": 2.0670705686515822e-05,
"loss": 0.3299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30649179220199585,
"step": 2335,
"valid_targets_mean": 3949.0,
"valid_targets_min": 1135
},
{
"epoch": 3.792544570502431,
"grad_norm": 0.7717847306436155,
"learning_rate": 2.0589922821967566e-05,
"loss": 0.3532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37374433875083923,
"step": 2340,
"valid_targets_mean": 3164.6,
"valid_targets_min": 1119
},
{
"epoch": 3.8006482982171796,
"grad_norm": 0.6474397322416555,
"learning_rate": 2.0509130323449545e-05,
"loss": 0.3315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30513161420822144,
"step": 2345,
"valid_targets_mean": 3070.5,
"valid_targets_min": 933
},
{
"epoch": 3.8087520259319287,
"grad_norm": 0.5480983935201096,
"learning_rate": 2.0428329510375838e-05,
"loss": 0.3197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.291774183511734,
"step": 2350,
"valid_targets_mean": 5193.6,
"valid_targets_min": 1208
},
{
"epoch": 3.8168557536466774,
"grad_norm": 0.7833094014207244,
"learning_rate": 2.0347521702296333e-05,
"loss": 0.3136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3558168113231659,
"step": 2355,
"valid_targets_mean": 2686.7,
"valid_targets_min": 1201
},
{
"epoch": 3.824959481361426,
"grad_norm": 0.7621050761785041,
"learning_rate": 2.026670821887516e-05,
"loss": 0.3188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29817432165145874,
"step": 2360,
"valid_targets_mean": 2564.6,
"valid_targets_min": 628
},
{
"epoch": 3.833063209076175,
"grad_norm": 0.7337736559637801,
"learning_rate": 2.0185890379869115e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34583503007888794,
"step": 2365,
"valid_targets_mean": 3290.3,
"valid_targets_min": 1456
},
{
"epoch": 3.841166936790924,
"grad_norm": 0.6579044742309087,
"learning_rate": 2.0105069505106126e-05,
"loss": 0.3055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30498212575912476,
"step": 2370,
"valid_targets_mean": 3680.5,
"valid_targets_min": 1111
},
{
"epoch": 3.8492706645056725,
"grad_norm": 0.6122672425508787,
"learning_rate": 2.00242469144637e-05,
"loss": 0.3155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32759958505630493,
"step": 2375,
"valid_targets_mean": 4098.4,
"valid_targets_min": 1125
},
{
"epoch": 3.8573743922204216,
"grad_norm": 0.6522969245487142,
"learning_rate": 1.994342392784738e-05,
"loss": 0.3488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4506216049194336,
"step": 2380,
"valid_targets_mean": 4865.1,
"valid_targets_min": 1181
},
{
"epoch": 3.86547811993517,
"grad_norm": 0.8104573831758627,
"learning_rate": 1.9862601865169154e-05,
"loss": 0.3602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3532731533050537,
"step": 2385,
"valid_targets_mean": 3282.5,
"valid_targets_min": 1020
},
{
"epoch": 3.873581847649919,
"grad_norm": 0.6575316647039278,
"learning_rate": 1.9781782046325938e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3369067311286926,
"step": 2390,
"valid_targets_mean": 3650.9,
"valid_targets_min": 1164
},
{
"epoch": 3.881685575364668,
"grad_norm": 1.0376247260450713,
"learning_rate": 1.9700965791177986e-05,
"loss": 0.3506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30998164415359497,
"step": 2395,
"valid_targets_mean": 4215.6,
"valid_targets_min": 1159
},
{
"epoch": 3.8897893030794166,
"grad_norm": 0.7122315974730362,
"learning_rate": 1.9620154419527372e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3429866135120392,
"step": 2400,
"valid_targets_mean": 3437.1,
"valid_targets_min": 959
},
{
"epoch": 3.8978930307941653,
"grad_norm": 0.5662001888178322,
"learning_rate": 1.953934925109641e-05,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2822979986667633,
"step": 2405,
"valid_targets_mean": 4019.1,
"valid_targets_min": 733
},
{
"epoch": 3.9059967585089144,
"grad_norm": 0.8419287234640135,
"learning_rate": 1.945855160550611e-05,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3056894838809967,
"step": 2410,
"valid_targets_mean": 4442.9,
"valid_targets_min": 1500
},
{
"epoch": 3.914100486223663,
"grad_norm": 0.6801232516837518,
"learning_rate": 1.937776280225463e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32119885087013245,
"step": 2415,
"valid_targets_mean": 3394.3,
"valid_targets_min": 985
},
{
"epoch": 3.9222042139384117,
"grad_norm": 0.6615050494532062,
"learning_rate": 1.929698416069571e-05,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3271116018295288,
"step": 2420,
"valid_targets_mean": 3491.4,
"valid_targets_min": 1466
},
{
"epoch": 3.9303079416531603,
"grad_norm": 0.6480829850992813,
"learning_rate": 1.9216217000017182e-05,
"loss": 0.3438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3169797658920288,
"step": 2425,
"valid_targets_mean": 3797.2,
"valid_targets_min": 1139
},
{
"epoch": 3.938411669367909,
"grad_norm": 0.6608189143051717,
"learning_rate": 1.9135462639219325e-05,
"loss": 0.3437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4551173448562622,
"step": 2430,
"valid_targets_mean": 4511.9,
"valid_targets_min": 1271
},
{
"epoch": 3.946515397082658,
"grad_norm": 0.6194102241113435,
"learning_rate": 1.905472239709343e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2990500330924988,
"step": 2435,
"valid_targets_mean": 4128.2,
"valid_targets_min": 741
},
{
"epoch": 3.9546191247974067,
"grad_norm": 0.5192772414872362,
"learning_rate": 1.89739975922002e-05,
"loss": 0.3177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26180487871170044,
"step": 2440,
"valid_targets_mean": 5093.2,
"valid_targets_min": 1237
},
{
"epoch": 3.9627228525121554,
"grad_norm": 0.5316589878706719,
"learning_rate": 1.889328954284823e-05,
"loss": 0.3231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29911136627197266,
"step": 2445,
"valid_targets_mean": 5077.1,
"valid_targets_min": 1327
},
{
"epoch": 3.9708265802269045,
"grad_norm": 0.6003750397681551,
"learning_rate": 1.8812599567072496e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3472042977809906,
"step": 2450,
"valid_targets_mean": 4503.7,
"valid_targets_min": 1596
},
{
"epoch": 3.978930307941653,
"grad_norm": 0.6559987437310445,
"learning_rate": 1.873192898261281e-05,
"loss": 0.3465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3218577802181244,
"step": 2455,
"valid_targets_mean": 3607.2,
"valid_targets_min": 895
},
{
"epoch": 3.987034035656402,
"grad_norm": 0.6531204473773664,
"learning_rate": 1.8651279106892317e-05,
"loss": 0.3485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3570401966571808,
"step": 2460,
"valid_targets_mean": 3725.1,
"valid_targets_min": 1448
},
{
"epoch": 3.995137763371151,
"grad_norm": 0.6130067904924766,
"learning_rate": 1.8570651256995933e-05,
"loss": 0.34,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30347344279289246,
"step": 2465,
"valid_targets_mean": 4397.4,
"valid_targets_min": 1067
},
{
"epoch": 4.003241491085899,
"grad_norm": 0.8400473811046529,
"learning_rate": 1.849004674964891e-05,
"loss": 0.3326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37068480253219604,
"step": 2470,
"valid_targets_mean": 2330.9,
"valid_targets_min": 1330
},
{
"epoch": 4.011345218800648,
"grad_norm": 0.8209932869507489,
"learning_rate": 1.840946690119528e-05,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3333631455898285,
"step": 2475,
"valid_targets_mean": 2441.2,
"valid_targets_min": 1213
},
{
"epoch": 4.019448946515397,
"grad_norm": 0.6924400519323498,
"learning_rate": 1.8328913027576373e-05,
"loss": 0.3063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25744473934173584,
"step": 2480,
"valid_targets_mean": 3704.8,
"valid_targets_min": 1284
},
{
"epoch": 4.0275526742301455,
"grad_norm": 0.627014797979199,
"learning_rate": 1.824838644430934e-05,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2638548016548157,
"step": 2485,
"valid_targets_mean": 4240.4,
"valid_targets_min": 999
},
{
"epoch": 4.035656401944895,
"grad_norm": 0.6411695887560652,
"learning_rate": 1.8167888466465652e-05,
"loss": 0.3312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.325685977935791,
"step": 2490,
"valid_targets_mean": 4314.9,
"valid_targets_min": 941
},
{
"epoch": 4.043760129659644,
"grad_norm": 0.7808679492122392,
"learning_rate": 1.8087420408649596e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3526899814605713,
"step": 2495,
"valid_targets_mean": 2995.1,
"valid_targets_min": 1278
},
{
"epoch": 4.051863857374392,
"grad_norm": 0.6650808996351736,
"learning_rate": 1.8006983584976877e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25968295335769653,
"step": 2500,
"valid_targets_mean": 3737.1,
"valid_targets_min": 1070
},
{
"epoch": 4.059967585089141,
"grad_norm": 0.6620959381335446,
"learning_rate": 1.7926579309053098e-05,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.275592565536499,
"step": 2505,
"valid_targets_mean": 3844.2,
"valid_targets_min": 1386
},
{
"epoch": 4.06807131280389,
"grad_norm": 0.611981072438135,
"learning_rate": 1.7846208893952346e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2791903614997864,
"step": 2510,
"valid_targets_mean": 4565.8,
"valid_targets_min": 1242
},
{
"epoch": 4.076175040518638,
"grad_norm": 0.6412358606975395,
"learning_rate": 1.7765873652195713e-05,
"loss": 0.3192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3951537609100342,
"step": 2515,
"valid_targets_mean": 4688.7,
"valid_targets_min": 837
},
{
"epoch": 4.084278768233387,
"grad_norm": 0.7188217457261792,
"learning_rate": 1.7685574895729886e-05,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31020399928092957,
"step": 2520,
"valid_targets_mean": 3320.2,
"valid_targets_min": 823
},
{
"epoch": 4.0923824959481365,
"grad_norm": 0.6980680753937775,
"learning_rate": 1.7605313935905722e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31744128465652466,
"step": 2525,
"valid_targets_mean": 4232.6,
"valid_targets_min": 1243
},
{
"epoch": 4.100486223662885,
"grad_norm": 0.7692631551657655,
"learning_rate": 1.7525092083456795e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30562955141067505,
"step": 2530,
"valid_targets_mean": 2824.4,
"valid_targets_min": 1129
},
{
"epoch": 4.108589951377634,
"grad_norm": 0.8164264535125219,
"learning_rate": 1.744491064847805e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31630781292915344,
"step": 2535,
"valid_targets_mean": 2976.9,
"valid_targets_min": 865
},
{
"epoch": 4.116693679092383,
"grad_norm": 0.7838788568786066,
"learning_rate": 1.7364770940404375e-05,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2557229995727539,
"step": 2540,
"valid_targets_mean": 3894.8,
"valid_targets_min": 1361
},
{
"epoch": 4.124797406807131,
"grad_norm": 0.6054279363053395,
"learning_rate": 1.7284674267989213e-05,
"loss": 0.3191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26003241539001465,
"step": 2545,
"valid_targets_mean": 4236.4,
"valid_targets_min": 1023
},
{
"epoch": 4.13290113452188,
"grad_norm": 0.6753456498802832,
"learning_rate": 1.72046219392832e-05,
"loss": 0.3109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3229011297225952,
"step": 2550,
"valid_targets_mean": 3918.2,
"valid_targets_min": 1319
},
{
"epoch": 4.1410048622366284,
"grad_norm": 0.9066318534345271,
"learning_rate": 1.712461526161279e-05,
"loss": 0.3346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3370896577835083,
"step": 2555,
"valid_targets_mean": 3921.2,
"valid_targets_min": 684
},
{
"epoch": 4.1491085899513775,
"grad_norm": 0.6943027908207531,
"learning_rate": 1.7044655541558934e-05,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36387622356414795,
"step": 2560,
"valid_targets_mean": 3734.2,
"valid_targets_min": 1098
},
{
"epoch": 4.157212317666127,
"grad_norm": 0.6280793763976201,
"learning_rate": 1.69647440849357e-05,
"loss": 0.3334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29390856623649597,
"step": 2565,
"valid_targets_mean": 4059.8,
"valid_targets_min": 1173
},
{
"epoch": 4.165316045380875,
"grad_norm": 0.8652306023704479,
"learning_rate": 1.6884882196768985e-05,
"loss": 0.3279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.351234495639801,
"step": 2570,
"valid_targets_mean": 2524.9,
"valid_targets_min": 1160
},
{
"epoch": 4.173419773095624,
"grad_norm": 0.6507876691877541,
"learning_rate": 1.680507118127518e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2786210775375366,
"step": 2575,
"valid_targets_mean": 4142.7,
"valid_targets_min": 1027
},
{
"epoch": 4.181523500810373,
"grad_norm": 0.4778265253290313,
"learning_rate": 1.6725312341839895e-05,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3144574463367462,
"step": 2580,
"valid_targets_mean": 7203.1,
"valid_targets_min": 1984
},
{
"epoch": 4.189627228525121,
"grad_norm": 0.7392662761852493,
"learning_rate": 1.664560698099664e-05,
"loss": 0.3002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28497248888015747,
"step": 2585,
"valid_targets_mean": 2962.3,
"valid_targets_min": 1237
},
{
"epoch": 4.19773095623987,
"grad_norm": 0.6112256034306288,
"learning_rate": 1.6565956400405586e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2852174639701843,
"step": 2590,
"valid_targets_mean": 4563.4,
"valid_targets_min": 995
},
{
"epoch": 4.2058346839546195,
"grad_norm": 0.796163466102447,
"learning_rate": 1.6486361900832284e-05,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3211726248264313,
"step": 2595,
"valid_targets_mean": 3132.4,
"valid_targets_min": 805
},
{
"epoch": 4.213938411669368,
"grad_norm": 1.3208522637127655,
"learning_rate": 1.6406824782126428e-05,
"loss": 0.3245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30766162276268005,
"step": 2600,
"valid_targets_mean": 3026.2,
"valid_targets_min": 1100
},
{
"epoch": 4.222042139384117,
"grad_norm": 0.8272038623649756,
"learning_rate": 1.632734634320064e-05,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30653703212738037,
"step": 2605,
"valid_targets_mean": 2404.6,
"valid_targets_min": 1100
},
{
"epoch": 4.230145867098866,
"grad_norm": 0.7401433175255077,
"learning_rate": 1.6247927882009256e-05,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.266494482755661,
"step": 2610,
"valid_targets_mean": 3482.1,
"valid_targets_min": 1333
},
{
"epoch": 4.238249594813614,
"grad_norm": 0.7195940311079241,
"learning_rate": 1.6168570695527096e-05,
"loss": 0.368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40879541635513306,
"step": 2615,
"valid_targets_mean": 4103.9,
"valid_targets_min": 970
},
{
"epoch": 4.246353322528363,
"grad_norm": 0.6953987582503965,
"learning_rate": 1.6089276079728334e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2825435698032379,
"step": 2620,
"valid_targets_mean": 3658.1,
"valid_targets_min": 1149
},
{
"epoch": 4.254457050243111,
"grad_norm": 0.7884023109909745,
"learning_rate": 1.6010045329565294e-05,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29981517791748047,
"step": 2625,
"valid_targets_mean": 2593.6,
"valid_targets_min": 1171
},
{
"epoch": 4.2625607779578605,
"grad_norm": 0.878488278755131,
"learning_rate": 1.5930879738947328e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3167850971221924,
"step": 2630,
"valid_targets_mean": 2434.6,
"valid_targets_min": 983
},
{
"epoch": 4.27066450567261,
"grad_norm": 0.6394432218196988,
"learning_rate": 1.585178060071966e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2784843146800995,
"step": 2635,
"valid_targets_mean": 4280.8,
"valid_targets_min": 1001
},
{
"epoch": 4.278768233387358,
"grad_norm": 0.5920424009782541,
"learning_rate": 1.5772749206642296e-05,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2522963285446167,
"step": 2640,
"valid_targets_mean": 4178.9,
"valid_targets_min": 1028
},
{
"epoch": 4.286871961102107,
"grad_norm": 0.5768126619167596,
"learning_rate": 1.5693786847368918e-05,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2204509675502777,
"step": 2645,
"valid_targets_mean": 4170.9,
"valid_targets_min": 1110
},
{
"epoch": 4.294975688816856,
"grad_norm": 0.6628529323864057,
"learning_rate": 1.5614894812425806e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.273931622505188,
"step": 2650,
"valid_targets_mean": 3944.0,
"valid_targets_min": 1176
},
{
"epoch": 4.303079416531604,
"grad_norm": 0.6807384959247684,
"learning_rate": 1.5536074390190786e-05,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29452162981033325,
"step": 2655,
"valid_targets_mean": 4216.1,
"valid_targets_min": 996
},
{
"epoch": 4.311183144246353,
"grad_norm": 0.7186908503646409,
"learning_rate": 1.5457326867872177e-05,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.305240273475647,
"step": 2660,
"valid_targets_mean": 3643.4,
"valid_targets_min": 979
},
{
"epoch": 4.319286871961102,
"grad_norm": 0.6108649365109375,
"learning_rate": 1.5378653531487784e-05,
"loss": 0.3095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2870018780231476,
"step": 2665,
"valid_targets_mean": 4265.2,
"valid_targets_min": 1149
},
{
"epoch": 4.327390599675851,
"grad_norm": 0.5974723937021044,
"learning_rate": 1.5300055665843875e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2622985243797302,
"step": 2670,
"valid_targets_mean": 4460.7,
"valid_targets_min": 1098
},
{
"epoch": 4.3354943273906,
"grad_norm": 0.813553355020424,
"learning_rate": 1.5221534554514225e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31859850883483887,
"step": 2675,
"valid_targets_mean": 2785.9,
"valid_targets_min": 906
},
{
"epoch": 4.343598055105349,
"grad_norm": 0.6516710233193221,
"learning_rate": 1.5143091479819146e-05,
"loss": 0.3136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2503086030483246,
"step": 2680,
"valid_targets_mean": 3712.2,
"valid_targets_min": 1218
},
{
"epoch": 4.351701782820097,
"grad_norm": 0.6614846672676474,
"learning_rate": 1.5064727722804531e-05,
"loss": 0.2674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2952650785446167,
"step": 2685,
"valid_targets_mean": 3959.1,
"valid_targets_min": 1150
},
{
"epoch": 4.359805510534846,
"grad_norm": 0.596297231951026,
"learning_rate": 1.4986444563220948e-05,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3439939022064209,
"step": 2690,
"valid_targets_mean": 4940.2,
"valid_targets_min": 1332
},
{
"epoch": 4.367909238249595,
"grad_norm": 0.5643409274980202,
"learning_rate": 1.4908243279502741e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3852804899215698,
"step": 2695,
"valid_targets_mean": 5347.9,
"valid_targets_min": 1164
},
{
"epoch": 4.376012965964343,
"grad_norm": 0.7304625760670628,
"learning_rate": 1.4830125148747138e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31127190589904785,
"step": 2700,
"valid_targets_mean": 4680.9,
"valid_targets_min": 999
},
{
"epoch": 4.3841166936790925,
"grad_norm": 0.6640526144672068,
"learning_rate": 1.475209144669341e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26242735981941223,
"step": 2705,
"valid_targets_mean": 3676.2,
"valid_targets_min": 969
},
{
"epoch": 4.392220421393841,
"grad_norm": 0.8292112236286381,
"learning_rate": 1.4674143447702036e-05,
"loss": 0.2815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29638242721557617,
"step": 2710,
"valid_targets_mean": 2692.6,
"valid_targets_min": 351
},
{
"epoch": 4.40032414910859,
"grad_norm": 0.6417348703212333,
"learning_rate": 1.4596282424733877e-05,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2617226839065552,
"step": 2715,
"valid_targets_mean": 3868.3,
"valid_targets_min": 1093
},
{
"epoch": 4.408427876823339,
"grad_norm": 0.7926194067640823,
"learning_rate": 1.4518509649329406e-05,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2919907569885254,
"step": 2720,
"valid_targets_mean": 2726.9,
"valid_targets_min": 1215
},
{
"epoch": 4.416531604538087,
"grad_norm": 0.7677690933979908,
"learning_rate": 1.4440826391587926e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30967211723327637,
"step": 2725,
"valid_targets_mean": 3164.4,
"valid_targets_min": 1702
},
{
"epoch": 4.424635332252836,
"grad_norm": 0.7635518361684928,
"learning_rate": 1.4363233920146855e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31172192096710205,
"step": 2730,
"valid_targets_mean": 3045.9,
"valid_targets_min": 1326
},
{
"epoch": 4.432739059967585,
"grad_norm": 0.5954227022352406,
"learning_rate": 1.4285733502160955e-05,
"loss": 0.3165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26830658316612244,
"step": 2735,
"valid_targets_mean": 4789.5,
"valid_targets_min": 311
},
{
"epoch": 4.4408427876823335,
"grad_norm": 0.5961589587008379,
"learning_rate": 1.4208326403281702e-05,
"loss": 0.3272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3103683888912201,
"step": 2740,
"valid_targets_mean": 4827.6,
"valid_targets_min": 1115
},
{
"epoch": 4.448946515397083,
"grad_norm": 0.5974178836414327,
"learning_rate": 1.4131013887636576e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3044317364692688,
"step": 2745,
"valid_targets_mean": 4834.2,
"valid_targets_min": 890
},
{
"epoch": 4.457050243111832,
"grad_norm": 0.5924507972312091,
"learning_rate": 1.4053797217808432e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23466259241104126,
"step": 2750,
"valid_targets_mean": 4736.9,
"valid_targets_min": 1096
},
{
"epoch": 4.46515397082658,
"grad_norm": 0.7050432170850669,
"learning_rate": 1.3976677654814866e-05,
"loss": 0.3217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3333389461040497,
"step": 2755,
"valid_targets_mean": 3746.6,
"valid_targets_min": 1264
},
{
"epoch": 4.473257698541329,
"grad_norm": 0.625082671183627,
"learning_rate": 1.3899656458087647e-05,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26414743065834045,
"step": 2760,
"valid_targets_mean": 4043.4,
"valid_targets_min": 1157
},
{
"epoch": 4.481361426256078,
"grad_norm": 0.6545938419305839,
"learning_rate": 1.3822734885452136e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26352810859680176,
"step": 2765,
"valid_targets_mean": 3948.2,
"valid_targets_min": 906
},
{
"epoch": 4.489465153970826,
"grad_norm": 0.5856504955272438,
"learning_rate": 1.3745914193106715e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2534196972846985,
"step": 2770,
"valid_targets_mean": 4745.9,
"valid_targets_min": 1245
},
{
"epoch": 4.4975688816855754,
"grad_norm": 0.6637431157492306,
"learning_rate": 1.366919563560233e-05,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28753918409347534,
"step": 2775,
"valid_targets_mean": 4114.1,
"valid_targets_min": 628
},
{
"epoch": 4.5056726094003245,
"grad_norm": 0.5874971907386854,
"learning_rate": 1.3592580465821956e-05,
"loss": 0.3361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26772981882095337,
"step": 2780,
"valid_targets_mean": 4026.8,
"valid_targets_min": 1021
},
{
"epoch": 4.513776337115073,
"grad_norm": 0.7407905359047069,
"learning_rate": 1.3516069934960174e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3074095845222473,
"step": 2785,
"valid_targets_mean": 3382.6,
"valid_targets_min": 1153
},
{
"epoch": 4.521880064829822,
"grad_norm": 0.6700473537828823,
"learning_rate": 1.3439665292502695e-05,
"loss": 0.3056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3244781494140625,
"step": 2790,
"valid_targets_mean": 3940.2,
"valid_targets_min": 1105
},
{
"epoch": 4.52998379254457,
"grad_norm": 1.055189769478214,
"learning_rate": 1.3363367786205985e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33718210458755493,
"step": 2795,
"valid_targets_mean": 3863.8,
"valid_targets_min": 1728
},
{
"epoch": 4.538087520259319,
"grad_norm": 0.7112409148556906,
"learning_rate": 1.3287178662076893e-05,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3041728138923645,
"step": 2800,
"valid_targets_mean": 3700.9,
"valid_targets_min": 1333
},
{
"epoch": 4.546191247974068,
"grad_norm": 0.7156076125028735,
"learning_rate": 1.3211099164352261e-05,
"loss": 0.3104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3130621016025543,
"step": 2805,
"valid_targets_mean": 3578.9,
"valid_targets_min": 1106
},
{
"epoch": 4.5542949756888165,
"grad_norm": 0.8719843408287105,
"learning_rate": 1.3135130535478655e-05,
"loss": 0.3133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32647475600242615,
"step": 2810,
"valid_targets_mean": 2229.1,
"valid_targets_min": 1139
},
{
"epoch": 4.562398703403566,
"grad_norm": 0.6029727322953958,
"learning_rate": 1.3059274016092057e-05,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911962568759918,
"step": 2815,
"valid_targets_mean": 4290.5,
"valid_targets_min": 1470
},
{
"epoch": 4.570502431118315,
"grad_norm": 0.5961063625812331,
"learning_rate": 1.2983530844997585e-05,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26468124985694885,
"step": 2820,
"valid_targets_mean": 4589.2,
"valid_targets_min": 1347
},
{
"epoch": 4.578606158833063,
"grad_norm": 0.5660573404796354,
"learning_rate": 1.2907902259149287e-05,
"loss": 0.2807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2578660249710083,
"step": 2825,
"valid_targets_mean": 4920.9,
"valid_targets_min": 1288
},
{
"epoch": 4.586709886547812,
"grad_norm": 0.7280963642347,
"learning_rate": 1.2832389493629928e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32471543550491333,
"step": 2830,
"valid_targets_mean": 3581.1,
"valid_targets_min": 1017
},
{
"epoch": 4.594813614262561,
"grad_norm": 0.715412432811769,
"learning_rate": 1.275699378163083e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28921806812286377,
"step": 2835,
"valid_targets_mean": 3497.8,
"valid_targets_min": 1320
},
{
"epoch": 4.602917341977309,
"grad_norm": 0.6532672996527726,
"learning_rate": 1.2681716354431704e-05,
"loss": 0.3025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32215386629104614,
"step": 2840,
"valid_targets_mean": 4033.8,
"valid_targets_min": 749
},
{
"epoch": 4.611021069692058,
"grad_norm": 0.8260191084875083,
"learning_rate": 1.2606558441380587e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32344701886177063,
"step": 2845,
"valid_targets_mean": 3283.2,
"valid_targets_min": 1043
},
{
"epoch": 4.6191247974068075,
"grad_norm": 0.6939779814125713,
"learning_rate": 1.2531521269873736e-05,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27716442942619324,
"step": 2850,
"valid_targets_mean": 3567.2,
"valid_targets_min": 1014
},
{
"epoch": 4.627228525121556,
"grad_norm": 0.792117184497524,
"learning_rate": 1.245660606533559e-05,
"loss": 0.2794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3006155490875244,
"step": 2855,
"valid_targets_mean": 2872.9,
"valid_targets_min": 887
},
{
"epoch": 4.635332252836305,
"grad_norm": 1.4604402166637813,
"learning_rate": 1.2381814051198751e-05,
"loss": 0.3094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2872532606124878,
"step": 2860,
"valid_targets_mean": 3158.4,
"valid_targets_min": 1152
},
{
"epoch": 4.643435980551054,
"grad_norm": 0.7254348350390687,
"learning_rate": 1.2307146448884021e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911936044692993,
"step": 2865,
"valid_targets_mean": 3529.8,
"valid_targets_min": 1246
},
{
"epoch": 4.651539708265802,
"grad_norm": 0.6614033286563541,
"learning_rate": 1.2232604477780445e-05,
"loss": 0.272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2721143066883087,
"step": 2870,
"valid_targets_mean": 3971.7,
"valid_targets_min": 1283
},
{
"epoch": 4.659643435980551,
"grad_norm": 0.7213983514513054,
"learning_rate": 1.2158189355225382e-05,
"loss": 0.307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28996139764785767,
"step": 2875,
"valid_targets_mean": 3356.2,
"valid_targets_min": 943
},
{
"epoch": 4.667747163695299,
"grad_norm": 0.5944666004073663,
"learning_rate": 1.2083902296484659e-05,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28627628087997437,
"step": 2880,
"valid_targets_mean": 5012.4,
"valid_targets_min": 1118
},
{
"epoch": 4.6758508914100485,
"grad_norm": 0.6862135372991642,
"learning_rate": 1.2009744514732698e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3100573420524597,
"step": 2885,
"valid_targets_mean": 3498.6,
"valid_targets_min": 1077
},
{
"epoch": 4.683954619124798,
"grad_norm": 0.5823076416457025,
"learning_rate": 1.1935717221032707e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30757367610931396,
"step": 2890,
"valid_targets_mean": 4603.4,
"valid_targets_min": 1196
},
{
"epoch": 4.692058346839546,
"grad_norm": 0.6566892716189943,
"learning_rate": 1.1861821624316916e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3225197196006775,
"step": 2895,
"valid_targets_mean": 3725.3,
"valid_targets_min": 1058
},
{
"epoch": 4.700162074554295,
"grad_norm": 0.6976236384286916,
"learning_rate": 1.1788058931366822e-05,
"loss": 0.3277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4578794240951538,
"step": 2900,
"valid_targets_mean": 4013.0,
"valid_targets_min": 1016
},
{
"epoch": 4.708265802269044,
"grad_norm": 0.823649732616322,
"learning_rate": 1.1714430346793479e-05,
"loss": 0.3069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31944727897644043,
"step": 2905,
"valid_targets_mean": 2667.8,
"valid_targets_min": 1009
},
{
"epoch": 4.716369529983792,
"grad_norm": 0.6038110363670156,
"learning_rate": 1.1640937073017837e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2808373272418976,
"step": 2910,
"valid_targets_mean": 4206.1,
"valid_targets_min": 1537
},
{
"epoch": 4.724473257698541,
"grad_norm": 0.5706371680859499,
"learning_rate": 1.1567580310251097e-05,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29434657096862793,
"step": 2915,
"valid_targets_mean": 5014.4,
"valid_targets_min": 1214
},
{
"epoch": 4.73257698541329,
"grad_norm": 0.7418205606965962,
"learning_rate": 1.1494361256475105e-05,
"loss": 0.2992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3157218098640442,
"step": 2920,
"valid_targets_mean": 3176.5,
"valid_targets_min": 1332
},
{
"epoch": 4.740680713128039,
"grad_norm": 0.5164826345529684,
"learning_rate": 1.1421281107422804e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2267780900001526,
"step": 2925,
"valid_targets_mean": 5747.8,
"valid_targets_min": 1101
},
{
"epoch": 4.748784440842788,
"grad_norm": 0.7545936872796103,
"learning_rate": 1.1348341056558709e-05,
"loss": 0.3157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2719404697418213,
"step": 2930,
"valid_targets_mean": 3002.6,
"valid_targets_min": 1058
},
{
"epoch": 4.756888168557537,
"grad_norm": 0.6208311308778571,
"learning_rate": 1.1275542295059384e-05,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3292774558067322,
"step": 2935,
"valid_targets_mean": 4970.6,
"valid_targets_min": 1138
},
{
"epoch": 4.764991896272285,
"grad_norm": 0.6019183667184134,
"learning_rate": 1.1202886011794023e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3418167233467102,
"step": 2940,
"valid_targets_mean": 4616.4,
"valid_targets_min": 1057
},
{
"epoch": 4.773095623987034,
"grad_norm": 0.85052165270995,
"learning_rate": 1.1130373393305004e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2802833914756775,
"step": 2945,
"valid_targets_mean": 4332.2,
"valid_targets_min": 1019
},
{
"epoch": 4.781199351701783,
"grad_norm": 0.7917179246807688,
"learning_rate": 1.1058005623788564e-05,
"loss": 0.3151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3122570514678955,
"step": 2950,
"valid_targets_mean": 3426.0,
"valid_targets_min": 972
},
{
"epoch": 4.789303079416531,
"grad_norm": 0.7139017191012962,
"learning_rate": 1.0985783885075407e-05,
"loss": 0.313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.289265513420105,
"step": 2955,
"valid_targets_mean": 3680.8,
"valid_targets_min": 1375
},
{
"epoch": 4.7974068071312805,
"grad_norm": 0.8032957029552218,
"learning_rate": 1.0913709356611411e-05,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2865556478500366,
"step": 2960,
"valid_targets_mean": 2568.1,
"valid_targets_min": 607
},
{
"epoch": 4.805510534846029,
"grad_norm": 0.7258218597446954,
"learning_rate": 1.0841783215438406e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27492740750312805,
"step": 2965,
"valid_targets_mean": 3073.8,
"valid_targets_min": 1155
},
{
"epoch": 4.813614262560778,
"grad_norm": 0.9231645223463597,
"learning_rate": 1.07700066361749e-05,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2736729085445404,
"step": 2970,
"valid_targets_mean": 4219.8,
"valid_targets_min": 1500
},
{
"epoch": 4.821717990275527,
"grad_norm": 0.7204809432667069,
"learning_rate": 1.0698380790996921e-05,
"loss": 0.3165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4039513170719147,
"step": 2975,
"valid_targets_mean": 3791.6,
"valid_targets_min": 988
},
{
"epoch": 4.829821717990275,
"grad_norm": 0.7355419119699267,
"learning_rate": 1.0626906849618903e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32579725980758667,
"step": 2980,
"valid_targets_mean": 3853.4,
"valid_targets_min": 1194
},
{
"epoch": 4.837925445705024,
"grad_norm": 0.6872894810537605,
"learning_rate": 1.0555585979274513e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2627268433570862,
"step": 2985,
"valid_targets_mean": 3120.8,
"valid_targets_min": 1194
},
{
"epoch": 4.846029173419773,
"grad_norm": 0.6320865135995328,
"learning_rate": 1.0484419344697667e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33812516927719116,
"step": 2990,
"valid_targets_mean": 4165.2,
"valid_targets_min": 1044
},
{
"epoch": 4.854132901134522,
"grad_norm": 0.6525207154113098,
"learning_rate": 1.0413408108103445e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672692537307739,
"step": 2995,
"valid_targets_mean": 3958.0,
"valid_targets_min": 752
},
{
"epoch": 4.862236628849271,
"grad_norm": 0.7324504070792344,
"learning_rate": 1.0342553429169163e-05,
"loss": 0.3069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.308619886636734,
"step": 3000,
"valid_targets_mean": 3301.4,
"valid_targets_min": 720
},
{
"epoch": 4.87034035656402,
"grad_norm": 0.7729266863011056,
"learning_rate": 1.0271856465015388e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2953605055809021,
"step": 3005,
"valid_targets_mean": 3670.2,
"valid_targets_min": 1511
},
{
"epoch": 4.878444084278768,
"grad_norm": 0.6049298397937694,
"learning_rate": 1.0201318370187065e-05,
"loss": 0.318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28800350427627563,
"step": 3010,
"valid_targets_mean": 4787.6,
"valid_targets_min": 1243
},
{
"epoch": 4.886547811993517,
"grad_norm": 0.7118664172339165,
"learning_rate": 1.0130940296634683e-05,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31415632367134094,
"step": 3015,
"valid_targets_mean": 3257.8,
"valid_targets_min": 1108
},
{
"epoch": 4.894651539708266,
"grad_norm": 0.5531509637033187,
"learning_rate": 1.0060723393695411e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28131812810897827,
"step": 3020,
"valid_targets_mean": 4997.1,
"valid_targets_min": 1727
},
{
"epoch": 4.902755267423014,
"grad_norm": 0.5338020186024223,
"learning_rate": 9.990668808074378e-06,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28649789094924927,
"step": 3025,
"valid_targets_mean": 5955.0,
"valid_targets_min": 1806
},
{
"epoch": 4.9108589951377635,
"grad_norm": 0.7028420105154684,
"learning_rate": 9.920777683825906e-06,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2879384756088257,
"step": 3030,
"valid_targets_mean": 3591.8,
"valid_targets_min": 1963
},
{
"epoch": 4.918962722852513,
"grad_norm": 0.7304701576538732,
"learning_rate": 9.851051162334871e-06,
"loss": 0.3139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3374594449996948,
"step": 3035,
"valid_targets_mean": 3193.5,
"valid_targets_min": 863
},
{
"epoch": 4.927066450567261,
"grad_norm": 0.5865752240512088,
"learning_rate": 9.781490382298018e-06,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32436108589172363,
"step": 3040,
"valid_targets_mean": 4995.1,
"valid_targets_min": 1006
},
{
"epoch": 4.93517017828201,
"grad_norm": 0.8489788664414895,
"learning_rate": 9.712096479705382e-06,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3596591055393219,
"step": 3045,
"valid_targets_mean": 2581.2,
"valid_targets_min": 260
},
{
"epoch": 4.943273905996758,
"grad_norm": 0.6007400071384102,
"learning_rate": 9.642870587821761e-06,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2724454700946808,
"step": 3050,
"valid_targets_mean": 4420.8,
"valid_targets_min": 992
},
{
"epoch": 4.951377633711507,
"grad_norm": 0.7265588407960974,
"learning_rate": 9.573813837168166e-06,
"loss": 0.3017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30277544260025024,
"step": 3055,
"valid_targets_mean": 3065.9,
"valid_targets_min": 862
},
{
"epoch": 4.959481361426256,
"grad_norm": 0.7253607975993981,
"learning_rate": 9.504927355503399e-06,
"loss": 0.3311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33545592427253723,
"step": 3060,
"valid_targets_mean": 3197.4,
"valid_targets_min": 1275
},
{
"epoch": 4.9675850891410045,
"grad_norm": 0.6715975787612942,
"learning_rate": 9.436212267805591e-06,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28574198484420776,
"step": 3065,
"valid_targets_mean": 3559.9,
"valid_targets_min": 1152
},
{
"epoch": 4.975688816855754,
"grad_norm": 0.6147947824290071,
"learning_rate": 9.367669696253885e-06,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3622044324874878,
"step": 3070,
"valid_targets_mean": 5026.7,
"valid_targets_min": 829
},
{
"epoch": 4.983792544570503,
"grad_norm": 0.9266146599676338,
"learning_rate": 9.299300760210059e-06,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25320684909820557,
"step": 3075,
"valid_targets_mean": 5378.4,
"valid_targets_min": 1587
},
{
"epoch": 4.991896272285251,
"grad_norm": 0.886524861463812,
"learning_rate": 9.231106576200268e-06,
"loss": 0.3495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33286648988723755,
"step": 3080,
"valid_targets_mean": 2349.5,
"valid_targets_min": 769
},
{
"epoch": 5.0,
"grad_norm": 0.5637786613200365,
"learning_rate": 9.163088257896825e-06,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30712249875068665,
"step": 3085,
"valid_targets_mean": 5376.3,
"valid_targets_min": 1897
},
{
"epoch": 5.008103727714749,
"grad_norm": 0.679283516267655,
"learning_rate": 9.095246916099978e-06,
"loss": 0.269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30201444029808044,
"step": 3090,
"valid_targets_mean": 3832.2,
"valid_targets_min": 1418
},
{
"epoch": 5.016207455429497,
"grad_norm": 0.7170611382488913,
"learning_rate": 9.027583658719812e-06,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2814018130302429,
"step": 3095,
"valid_targets_mean": 3344.4,
"valid_targets_min": 1012
},
{
"epoch": 5.024311183144246,
"grad_norm": 0.6078632668782452,
"learning_rate": 8.960099590758104e-06,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3396990895271301,
"step": 3100,
"valid_targets_mean": 5253.6,
"valid_targets_min": 1140
},
{
"epoch": 5.0324149108589955,
"grad_norm": 0.7835574782392883,
"learning_rate": 8.892795814290342e-06,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2960517406463623,
"step": 3105,
"valid_targets_mean": 3160.6,
"valid_targets_min": 1256
},
{
"epoch": 5.040518638573744,
"grad_norm": 0.7378400262878008,
"learning_rate": 8.825673428447668e-06,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2975686192512512,
"step": 3110,
"valid_targets_mean": 3756.3,
"valid_targets_min": 1114
},
{
"epoch": 5.048622366288493,
"grad_norm": 0.6887905386158489,
"learning_rate": 8.758733529398945e-06,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2563658654689789,
"step": 3115,
"valid_targets_mean": 3989.8,
"valid_targets_min": 1070
},
{
"epoch": 5.056726094003242,
"grad_norm": 0.6618439575404061,
"learning_rate": 8.691977210332892e-06,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25922781229019165,
"step": 3120,
"valid_targets_mean": 4233.7,
"valid_targets_min": 898
},
{
"epoch": 5.06482982171799,
"grad_norm": 0.5650176047225448,
"learning_rate": 8.625405561440172e-06,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2414149045944214,
"step": 3125,
"valid_targets_mean": 4405.9,
"valid_targets_min": 344
},
{
"epoch": 5.072933549432739,
"grad_norm": 0.7330383005392311,
"learning_rate": 8.559019669895648e-06,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28208595514297485,
"step": 3130,
"valid_targets_mean": 3542.4,
"valid_targets_min": 969
},
{
"epoch": 5.081037277147487,
"grad_norm": 0.7265672842651938,
"learning_rate": 8.492820619840563e-06,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.256570041179657,
"step": 3135,
"valid_targets_mean": 4502.6,
"valid_targets_min": 1105
},
{
"epoch": 5.0891410048622365,
"grad_norm": 0.8957657482015896,
"learning_rate": 8.426809492364907e-06,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3049822449684143,
"step": 3140,
"valid_targets_mean": 2393.8,
"valid_targets_min": 752
},
{
"epoch": 5.097244732576986,
"grad_norm": 0.6466368422052554,
"learning_rate": 8.360987365489698e-06,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25956565141677856,
"step": 3145,
"valid_targets_mean": 4452.4,
"valid_targets_min": 463
},
{
"epoch": 5.105348460291734,
"grad_norm": 0.9077370475698178,
"learning_rate": 8.295355314149413e-06,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3483518362045288,
"step": 3150,
"valid_targets_mean": 2507.1,
"valid_targets_min": 863
},
{
"epoch": 5.113452188006483,
"grad_norm": 0.8110339444850555,
"learning_rate": 8.229914410174435e-06,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3136909008026123,
"step": 3155,
"valid_targets_mean": 2973.8,
"valid_targets_min": 800
},
{
"epoch": 5.121555915721232,
"grad_norm": 0.6807259870266567,
"learning_rate": 8.16466572227352e-06,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30755871534347534,
"step": 3160,
"valid_targets_mean": 3892.3,
"valid_targets_min": 1547
},
{
"epoch": 5.12965964343598,
"grad_norm": 0.658342938443184,
"learning_rate": 8.099610316016373e-06,
"loss": 0.2613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30165326595306396,
"step": 3165,
"valid_targets_mean": 4359.5,
"valid_targets_min": 1216
},
{
"epoch": 5.137763371150729,
"grad_norm": 0.9237059062611359,
"learning_rate": 8.03474925381625e-06,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3684241771697998,
"step": 3170,
"valid_targets_mean": 2736.1,
"valid_targets_min": 1269
},
{
"epoch": 5.145867098865478,
"grad_norm": 0.738400061019705,
"learning_rate": 7.97008359491257e-06,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29892492294311523,
"step": 3175,
"valid_targets_mean": 3671.7,
"valid_targets_min": 607
},
{
"epoch": 5.153970826580227,
"grad_norm": 0.653087724753744,
"learning_rate": 7.905614395353649e-06,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32275858521461487,
"step": 3180,
"valid_targets_mean": 4359.4,
"valid_targets_min": 1197
},
{
"epoch": 5.162074554294976,
"grad_norm": 0.7687704188424886,
"learning_rate": 7.841342707979442e-06,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2669990062713623,
"step": 3185,
"valid_targets_mean": 3254.8,
"valid_targets_min": 1262
},
{
"epoch": 5.170178282009725,
"grad_norm": 0.6145652140558867,
"learning_rate": 7.77726958240437e-06,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30221909284591675,
"step": 3190,
"valid_targets_mean": 4819.4,
"valid_targets_min": 998
},
{
"epoch": 5.178282009724473,
"grad_norm": 0.7821087325095586,
"learning_rate": 7.713396065000133e-06,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28741025924682617,
"step": 3195,
"valid_targets_mean": 3316.5,
"valid_targets_min": 937
},
{
"epoch": 5.186385737439222,
"grad_norm": 0.5251864451472283,
"learning_rate": 7.649723198878676e-06,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25311702489852905,
"step": 3200,
"valid_targets_mean": 5434.4,
"valid_targets_min": 1248
},
{
"epoch": 5.194489465153971,
"grad_norm": 0.7146340534365199,
"learning_rate": 7.586252023875125e-06,
"loss": 0.2924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2779831886291504,
"step": 3205,
"valid_targets_mean": 3548.5,
"valid_targets_min": 1142
},
{
"epoch": 5.2025931928687195,
"grad_norm": 0.6421920316889562,
"learning_rate": 7.522983576530791e-06,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2444455623626709,
"step": 3210,
"valid_targets_mean": 3775.6,
"valid_targets_min": 1018
},
{
"epoch": 5.210696920583469,
"grad_norm": 0.6085840752147157,
"learning_rate": 7.459918890076272e-06,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.286603718996048,
"step": 3215,
"valid_targets_mean": 5191.4,
"valid_targets_min": 1490
},
{
"epoch": 5.218800648298217,
"grad_norm": 0.682252527910381,
"learning_rate": 7.397058994414563e-06,
"loss": 0.2737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.283713698387146,
"step": 3220,
"valid_targets_mean": 4987.8,
"valid_targets_min": 1681
},
{
"epoch": 5.226904376012966,
"grad_norm": 0.761041867774423,
"learning_rate": 7.3344049161042495e-06,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30440282821655273,
"step": 3225,
"valid_targets_mean": 3551.4,
"valid_targets_min": 1016
},
{
"epoch": 5.235008103727715,
"grad_norm": 0.7457730095664243,
"learning_rate": 7.271957678342738e-06,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2805323898792267,
"step": 3230,
"valid_targets_mean": 3305.1,
"valid_targets_min": 296
},
{
"epoch": 5.243111831442463,
"grad_norm": 0.9269764600924907,
"learning_rate": 7.209718300949519e-06,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30809998512268066,
"step": 3235,
"valid_targets_mean": 3278.8,
"valid_targets_min": 974
},
{
"epoch": 5.251215559157212,
"grad_norm": 0.8608783945025844,
"learning_rate": 7.14768780034957e-06,
"loss": 0.2945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2784419357776642,
"step": 3240,
"valid_targets_mean": 2483.4,
"valid_targets_min": 684
},
{
"epoch": 5.259319286871961,
"grad_norm": 0.6552635503057336,
"learning_rate": 7.085867189556697e-06,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24957261979579926,
"step": 3245,
"valid_targets_mean": 4670.8,
"valid_targets_min": 1095
},
{
"epoch": 5.26742301458671,
"grad_norm": 0.7567556315587354,
"learning_rate": 7.024257478157015e-06,
"loss": 0.2496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25506865978240967,
"step": 3250,
"valid_targets_mean": 2933.9,
"valid_targets_min": 813
},
{
"epoch": 5.275526742301459,
"grad_norm": 0.6500169004006787,
"learning_rate": 6.96285967229249e-06,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.285958856344223,
"step": 3255,
"valid_targets_mean": 4448.9,
"valid_targets_min": 1187
},
{
"epoch": 5.283630470016208,
"grad_norm": 0.8005728973226811,
"learning_rate": 6.901674774644449e-06,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28087589144706726,
"step": 3260,
"valid_targets_mean": 3049.1,
"valid_targets_min": 1160
},
{
"epoch": 5.291734197730956,
"grad_norm": 0.7675907087887824,
"learning_rate": 6.840703784417262e-06,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28006839752197266,
"step": 3265,
"valid_targets_mean": 3114.2,
"valid_targets_min": 1522
},
{
"epoch": 5.299837925445705,
"grad_norm": 0.6700312471419494,
"learning_rate": 6.779947697321974e-06,
"loss": 0.2782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.276754766702652,
"step": 3270,
"valid_targets_mean": 4571.8,
"valid_targets_min": 991
},
{
"epoch": 5.307941653160454,
"grad_norm": 0.7128592910951062,
"learning_rate": 6.719407505560094e-06,
"loss": 0.2777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31054553389549255,
"step": 3275,
"valid_targets_mean": 4182.4,
"valid_targets_min": 1339
},
{
"epoch": 5.316045380875202,
"grad_norm": 0.6512636677298553,
"learning_rate": 6.659084197807348e-06,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29994767904281616,
"step": 3280,
"valid_targets_mean": 4672.8,
"valid_targets_min": 938
},
{
"epoch": 5.3241491085899515,
"grad_norm": 0.7606762515888708,
"learning_rate": 6.598978759197554e-06,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2889411151409149,
"step": 3285,
"valid_targets_mean": 3447.2,
"valid_targets_min": 1074
},
{
"epoch": 5.332252836304701,
"grad_norm": 0.7089462941061058,
"learning_rate": 6.539092171306541e-06,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2591246962547302,
"step": 3290,
"valid_targets_mean": 3852.4,
"valid_targets_min": 1615
},
{
"epoch": 5.340356564019449,
"grad_norm": 0.793316654437433,
"learning_rate": 6.479425412136093e-06,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2555570602416992,
"step": 3295,
"valid_targets_mean": 2712.8,
"valid_targets_min": 1193
},
{
"epoch": 5.348460291734198,
"grad_norm": 0.8133606076526989,
"learning_rate": 6.419979456098016e-06,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27769023180007935,
"step": 3300,
"valid_targets_mean": 2869.2,
"valid_targets_min": 885
},
{
"epoch": 5.356564019448946,
"grad_norm": 0.6768085806436803,
"learning_rate": 6.360755273998174e-06,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2373725026845932,
"step": 3305,
"valid_targets_mean": 3990.9,
"valid_targets_min": 427
},
{
"epoch": 5.364667747163695,
"grad_norm": 0.8302998958250895,
"learning_rate": 6.301753833020691e-06,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31967538595199585,
"step": 3310,
"valid_targets_mean": 2772.0,
"valid_targets_min": 1170
},
{
"epoch": 5.372771474878444,
"grad_norm": 0.5943028036049409,
"learning_rate": 6.242976096712112e-06,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29758501052856445,
"step": 3315,
"valid_targets_mean": 5840.2,
"valid_targets_min": 349
},
{
"epoch": 5.3808752025931925,
"grad_norm": 0.7157345315365573,
"learning_rate": 6.18442302496568e-06,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25914475321769714,
"step": 3320,
"valid_targets_mean": 3808.9,
"valid_targets_min": 1101
},
{
"epoch": 5.388978930307942,
"grad_norm": 0.7786866822617113,
"learning_rate": 6.1260955740056835e-06,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894706130027771,
"step": 3325,
"valid_targets_mean": 3148.8,
"valid_targets_min": 1090
},
{
"epoch": 5.397082658022691,
"grad_norm": 0.76294737241064,
"learning_rate": 6.067994696371797e-06,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2689441442489624,
"step": 3330,
"valid_targets_mean": 3199.1,
"valid_targets_min": 403
},
{
"epoch": 5.405186385737439,
"grad_norm": 0.7624414240294302,
"learning_rate": 6.010121340903574e-06,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2649106979370117,
"step": 3335,
"valid_targets_mean": 3114.9,
"valid_targets_min": 1195
},
{
"epoch": 5.413290113452188,
"grad_norm": 0.701323992069574,
"learning_rate": 5.952476452724898e-06,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3416491448879242,
"step": 3340,
"valid_targets_mean": 4082.7,
"valid_targets_min": 1759
},
{
"epoch": 5.421393841166937,
"grad_norm": 0.742330773570171,
"learning_rate": 5.895060973228606e-06,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3097589612007141,
"step": 3345,
"valid_targets_mean": 3322.2,
"valid_targets_min": 1518
},
{
"epoch": 5.429497568881685,
"grad_norm": 0.5877195535700861,
"learning_rate": 5.837875840061064e-06,
"loss": 0.2786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22878901660442352,
"step": 3350,
"valid_targets_mean": 4539.7,
"valid_targets_min": 1424
},
{
"epoch": 5.437601296596434,
"grad_norm": 0.6347647319563191,
"learning_rate": 5.780921987106878e-06,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23854267597198486,
"step": 3355,
"valid_targets_mean": 4752.8,
"valid_targets_min": 1023
},
{
"epoch": 5.4457050243111835,
"grad_norm": 0.8298002116959828,
"learning_rate": 5.724200344473651e-06,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27335381507873535,
"step": 3360,
"valid_targets_mean": 2939.4,
"valid_targets_min": 1065
},
{
"epoch": 5.453808752025932,
"grad_norm": 0.8280056823907535,
"learning_rate": 5.66771183847677e-06,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28138309717178345,
"step": 3365,
"valid_targets_mean": 3459.2,
"valid_targets_min": 1159
},
{
"epoch": 5.461912479740681,
"grad_norm": 0.7652229448911942,
"learning_rate": 5.611457391624309e-06,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2577538788318634,
"step": 3370,
"valid_targets_mean": 3450.9,
"valid_targets_min": 1069
},
{
"epoch": 5.47001620745543,
"grad_norm": 0.7271629799488672,
"learning_rate": 5.555437922601918e-06,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2700653672218323,
"step": 3375,
"valid_targets_mean": 3632.2,
"valid_targets_min": 1087
},
{
"epoch": 5.478119935170178,
"grad_norm": 0.8700764884307809,
"learning_rate": 5.499654346257879e-06,
"loss": 0.2807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2594822645187378,
"step": 3380,
"valid_targets_mean": 4346.2,
"valid_targets_min": 1358
},
{
"epoch": 5.486223662884927,
"grad_norm": 0.770381419374314,
"learning_rate": 5.444107573588116e-06,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3069581985473633,
"step": 3385,
"valid_targets_mean": 4150.8,
"valid_targets_min": 1292
},
{
"epoch": 5.4943273905996755,
"grad_norm": 0.6696438750203964,
"learning_rate": 5.388798511721329e-06,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23633962869644165,
"step": 3390,
"valid_targets_mean": 4223.9,
"valid_targets_min": 553
},
{
"epoch": 5.5024311183144246,
"grad_norm": 0.6855425861490273,
"learning_rate": 5.333728063904213e-06,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24334245920181274,
"step": 3395,
"valid_targets_mean": 3528.2,
"valid_targets_min": 1460
},
{
"epoch": 5.510534846029174,
"grad_norm": 0.786560444677125,
"learning_rate": 5.278897129486656e-06,
"loss": 0.3242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29019924998283386,
"step": 3400,
"valid_targets_mean": 3245.4,
"valid_targets_min": 1174
},
{
"epoch": 5.518638573743922,
"grad_norm": 0.7172670134554514,
"learning_rate": 5.224306603907095e-06,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28209179639816284,
"step": 3405,
"valid_targets_mean": 4107.5,
"valid_targets_min": 1070
},
{
"epoch": 5.526742301458671,
"grad_norm": 0.7350968379600731,
"learning_rate": 5.169957378677859e-06,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29147547483444214,
"step": 3410,
"valid_targets_mean": 3760.5,
"valid_targets_min": 1027
},
{
"epoch": 5.53484602917342,
"grad_norm": 0.7517239670767295,
"learning_rate": 5.11585034137064e-06,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2884262800216675,
"step": 3415,
"valid_targets_mean": 3442.4,
"valid_targets_min": 1271
},
{
"epoch": 5.542949756888168,
"grad_norm": 0.9054713950721245,
"learning_rate": 5.061986375601977e-06,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.366168349981308,
"step": 3420,
"valid_targets_mean": 2817.2,
"valid_targets_min": 1101
},
{
"epoch": 5.551053484602917,
"grad_norm": 0.6501242905430781,
"learning_rate": 5.0083663610188215e-06,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24292755126953125,
"step": 3425,
"valid_targets_mean": 4625.0,
"valid_targets_min": 1485
},
{
"epoch": 5.5591572123176665,
"grad_norm": 1.4505012508960171,
"learning_rate": 4.954991173284207e-06,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2867453694343567,
"step": 3430,
"valid_targets_mean": 3474.4,
"valid_targets_min": 1479
},
{
"epoch": 5.567260940032415,
"grad_norm": 0.8611869362587048,
"learning_rate": 4.901861684062899e-06,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.303717702627182,
"step": 3435,
"valid_targets_mean": 2582.6,
"valid_targets_min": 1024
},
{
"epoch": 5.575364667747164,
"grad_norm": 0.6318517106242182,
"learning_rate": 4.848978761007206e-06,
"loss": 0.3235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35377246141433716,
"step": 3440,
"valid_targets_mean": 5696.1,
"valid_targets_min": 1209
},
{
"epoch": 5.583468395461912,
"grad_norm": 0.7580961353653848,
"learning_rate": 4.796343267742782e-06,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27109336853027344,
"step": 3445,
"valid_targets_mean": 3441.2,
"valid_targets_min": 1022
},
{
"epoch": 5.591572123176661,
"grad_norm": 0.8569431910573655,
"learning_rate": 4.743956063854529e-06,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3265492916107178,
"step": 3450,
"valid_targets_mean": 3613.4,
"valid_targets_min": 1007
},
{
"epoch": 5.59967585089141,
"grad_norm": 0.6785717564457475,
"learning_rate": 4.691818004872557e-06,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23201988637447357,
"step": 3455,
"valid_targets_mean": 3884.2,
"valid_targets_min": 1076
},
{
"epoch": 5.607779578606159,
"grad_norm": 1.5751988259842302,
"learning_rate": 4.639929942258217e-06,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24123671650886536,
"step": 3460,
"valid_targets_mean": 3035.5,
"valid_targets_min": 991
},
{
"epoch": 5.6158833063209075,
"grad_norm": 0.671534242940153,
"learning_rate": 4.588292723390204e-06,
"loss": 0.2613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23632174730300903,
"step": 3465,
"valid_targets_mean": 4311.9,
"valid_targets_min": 954
},
{
"epoch": 5.623987034035657,
"grad_norm": 0.6599509783390952,
"learning_rate": 4.536907191550694e-06,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2659260928630829,
"step": 3470,
"valid_targets_mean": 3626.4,
"valid_targets_min": 902
},
{
"epoch": 5.632090761750405,
"grad_norm": 0.8703140687361607,
"learning_rate": 4.4857741859116024e-06,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3029107451438904,
"step": 3475,
"valid_targets_mean": 2693.6,
"valid_targets_min": 971
},
{
"epoch": 5.640194489465154,
"grad_norm": 0.7936006609606302,
"learning_rate": 4.434894541520862e-06,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25295132398605347,
"step": 3480,
"valid_targets_mean": 2842.1,
"valid_targets_min": 863
},
{
"epoch": 5.648298217179903,
"grad_norm": 0.7231262588490622,
"learning_rate": 4.3842690892887795e-06,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3111575245857239,
"step": 3485,
"valid_targets_mean": 3719.8,
"valid_targets_min": 745
},
{
"epoch": 5.656401944894651,
"grad_norm": 0.6158823413371348,
"learning_rate": 4.333898655974484e-06,
"loss": 0.2713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26768383383750916,
"step": 3490,
"valid_targets_mean": 4432.0,
"valid_targets_min": 1369
},
{
"epoch": 5.6645056726094,
"grad_norm": 0.8979021634703408,
"learning_rate": 4.283784064172405e-06,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32060831785202026,
"step": 3495,
"valid_targets_mean": 3322.2,
"valid_targets_min": 828
},
{
"epoch": 5.672609400324149,
"grad_norm": 0.5686930143372391,
"learning_rate": 4.233926132298867e-06,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24507595598697662,
"step": 3500,
"valid_targets_mean": 6302.6,
"valid_targets_min": 968
},
{
"epoch": 5.680713128038898,
"grad_norm": 0.4277289698869093,
"learning_rate": 4.1843256745787e-06,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2321561872959137,
"step": 3505,
"valid_targets_mean": 8880.2,
"valid_targets_min": 2792
},
{
"epoch": 5.688816855753647,
"grad_norm": 0.8297040218872506,
"learning_rate": 4.134983501031942e-06,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2722494900226593,
"step": 3510,
"valid_targets_mean": 3655.5,
"valid_targets_min": 874
},
{
"epoch": 5.696920583468396,
"grad_norm": 0.7829749027309345,
"learning_rate": 4.085900417460633e-06,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4337892532348633,
"step": 3515,
"valid_targets_mean": 3732.4,
"valid_targets_min": 733
},
{
"epoch": 5.705024311183144,
"grad_norm": 0.8126084942082932,
"learning_rate": 4.037077225435628e-06,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28513067960739136,
"step": 3520,
"valid_targets_mean": 2776.5,
"valid_targets_min": 1013
},
{
"epoch": 5.713128038897893,
"grad_norm": 0.8953819330769611,
"learning_rate": 3.988514722283523e-06,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3385658860206604,
"step": 3525,
"valid_targets_mean": 2753.9,
"valid_targets_min": 1290
},
{
"epoch": 5.721231766612641,
"grad_norm": 0.6417576970627987,
"learning_rate": 3.940213701073636e-06,
"loss": 0.2674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2606130838394165,
"step": 3530,
"valid_targets_mean": 4978.7,
"valid_targets_min": 752
},
{
"epoch": 5.72933549432739,
"grad_norm": 0.594036263261497,
"learning_rate": 3.892174950605039e-06,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24494385719299316,
"step": 3535,
"valid_targets_mean": 4648.3,
"valid_targets_min": 696
},
{
"epoch": 5.7374392220421395,
"grad_norm": 0.674852622493003,
"learning_rate": 3.844399255393705e-06,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30853283405303955,
"step": 3540,
"valid_targets_mean": 5255.0,
"valid_targets_min": 1038
},
{
"epoch": 5.745542949756889,
"grad_norm": 0.801058537021668,
"learning_rate": 3.7968873956596563e-06,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3078470826148987,
"step": 3545,
"valid_targets_mean": 3194.4,
"valid_targets_min": 1115
},
{
"epoch": 5.753646677471637,
"grad_norm": 0.7048342023609044,
"learning_rate": 3.749640147314264e-06,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24763602018356323,
"step": 3550,
"valid_targets_mean": 3711.5,
"valid_targets_min": 1193
},
{
"epoch": 5.761750405186386,
"grad_norm": 0.7693710636718659,
"learning_rate": 3.7026582819475443e-06,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23135964572429657,
"step": 3555,
"valid_targets_mean": 3138.4,
"valid_targets_min": 1205
},
{
"epoch": 5.769854132901134,
"grad_norm": 0.6632199872131253,
"learning_rate": 3.6559425668155733e-06,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27239274978637695,
"step": 3560,
"valid_targets_mean": 4193.6,
"valid_targets_min": 1230
},
{
"epoch": 5.777957860615883,
"grad_norm": 0.718545305799666,
"learning_rate": 3.6094937648279647e-06,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2218991219997406,
"step": 3565,
"valid_targets_mean": 5719.2,
"valid_targets_min": 867
},
{
"epoch": 5.786061588330632,
"grad_norm": 0.7244639386188173,
"learning_rate": 3.563312634535383e-06,
"loss": 0.3007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30564481019973755,
"step": 3570,
"valid_targets_mean": 3467.5,
"valid_targets_min": 967
},
{
"epoch": 5.7941653160453805,
"grad_norm": 0.5617300881909284,
"learning_rate": 3.517399930117196e-06,
"loss": 0.2945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33648714423179626,
"step": 3575,
"valid_targets_mean": 5446.6,
"valid_targets_min": 964
},
{
"epoch": 5.80226904376013,
"grad_norm": 0.6597389907883395,
"learning_rate": 3.4717564013691087e-06,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2604525685310364,
"step": 3580,
"valid_targets_mean": 3790.9,
"valid_targets_min": 1105
},
{
"epoch": 5.810372771474879,
"grad_norm": 0.7745748020298397,
"learning_rate": 3.4263827936909744e-06,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2584492266178131,
"step": 3585,
"valid_targets_mean": 3191.6,
"valid_targets_min": 1160
},
{
"epoch": 5.818476499189627,
"grad_norm": 0.6810368699743038,
"learning_rate": 3.38127984807457e-06,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27961236238479614,
"step": 3590,
"valid_targets_mean": 3924.9,
"valid_targets_min": 1286
},
{
"epoch": 5.826580226904376,
"grad_norm": 0.6841769486834594,
"learning_rate": 3.3364483010915237e-06,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27105721831321716,
"step": 3595,
"valid_targets_mean": 4534.7,
"valid_targets_min": 1292
},
{
"epoch": 5.834683954619125,
"grad_norm": 0.6233870726744284,
"learning_rate": 3.2918888848812913e-06,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30562299489974976,
"step": 3600,
"valid_targets_mean": 4270.6,
"valid_targets_min": 870
},
{
"epoch": 5.842787682333873,
"grad_norm": 0.8764854670185418,
"learning_rate": 3.2476023271391698e-06,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34314560890197754,
"step": 3605,
"valid_targets_mean": 2687.0,
"valid_targets_min": 741
},
{
"epoch": 5.8508914100486225,
"grad_norm": 0.7598308829904862,
"learning_rate": 3.2035893511044524e-06,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2514714300632477,
"step": 3610,
"valid_targets_mean": 4512.1,
"valid_targets_min": 1199
},
{
"epoch": 5.858995137763371,
"grad_norm": 0.685998691912319,
"learning_rate": 3.159850675548577e-06,
"loss": 0.3129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35390257835388184,
"step": 3615,
"valid_targets_mean": 4823.4,
"valid_targets_min": 1638
},
{
"epoch": 5.86709886547812,
"grad_norm": 0.7124267141614449,
"learning_rate": 3.116387014763429e-06,
"loss": 0.3014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29345035552978516,
"step": 3620,
"valid_targets_mean": 3753.6,
"valid_targets_min": 1064
},
{
"epoch": 5.875202593192869,
"grad_norm": 0.6137149594151944,
"learning_rate": 3.073199078549638e-06,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2540719509124756,
"step": 3625,
"valid_targets_mean": 5363.9,
"valid_targets_min": 1437
},
{
"epoch": 5.883306320907618,
"grad_norm": 0.6867497382371595,
"learning_rate": 3.0302875722050064e-06,
"loss": 0.2714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29915332794189453,
"step": 3630,
"valid_targets_mean": 3797.4,
"valid_targets_min": 964
},
{
"epoch": 5.891410048622366,
"grad_norm": 0.6615681011902053,
"learning_rate": 2.987653196513003e-06,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24344134330749512,
"step": 3635,
"valid_targets_mean": 4025.9,
"valid_targets_min": 918
},
{
"epoch": 5.899513776337115,
"grad_norm": 0.7630726256680385,
"learning_rate": 2.9452966477312815e-06,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2798713743686676,
"step": 3640,
"valid_targets_mean": 3439.8,
"valid_targets_min": 1266
},
{
"epoch": 5.9076175040518635,
"grad_norm": 0.7157631234965041,
"learning_rate": 2.9032186175803545e-06,
"loss": 0.27,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2654950022697449,
"step": 3645,
"valid_targets_mean": 3439.6,
"valid_targets_min": 868
},
{
"epoch": 5.915721231766613,
"grad_norm": 0.907754147422762,
"learning_rate": 2.8614197932322585e-06,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3148188591003418,
"step": 3650,
"valid_targets_mean": 2466.9,
"valid_targets_min": 991
},
{
"epoch": 5.923824959481362,
"grad_norm": 0.6769846106042888,
"learning_rate": 2.819900857299358e-06,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29736822843551636,
"step": 3655,
"valid_targets_mean": 4191.1,
"valid_targets_min": 1110
},
{
"epoch": 5.93192868719611,
"grad_norm": 0.7096793380763345,
"learning_rate": 2.778662487823187e-06,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.283025860786438,
"step": 3660,
"valid_targets_mean": 4360.5,
"valid_targets_min": 1225
},
{
"epoch": 5.940032414910859,
"grad_norm": 0.616843225159254,
"learning_rate": 2.7377053582633652e-06,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2597149610519409,
"step": 3665,
"valid_targets_mean": 5154.5,
"valid_targets_min": 1217
},
{
"epoch": 5.948136142625608,
"grad_norm": 0.6764261015597512,
"learning_rate": 2.6970301374866337e-06,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24780400097370148,
"step": 3670,
"valid_targets_mean": 3628.2,
"valid_targets_min": 1129
},
{
"epoch": 5.956239870340356,
"grad_norm": 0.8480710671748108,
"learning_rate": 2.656637489755889e-06,
"loss": 0.2815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29920557141304016,
"step": 3675,
"valid_targets_mean": 2949.8,
"valid_targets_min": 1047
},
{
"epoch": 5.964343598055105,
"grad_norm": 0.6732019095661717,
"learning_rate": 2.616528074719371e-06,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2520577609539032,
"step": 3680,
"valid_targets_mean": 4207.6,
"valid_targets_min": 1149
},
{
"epoch": 5.9724473257698545,
"grad_norm": 0.8349743498637383,
"learning_rate": 2.576702547399863e-06,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27137356996536255,
"step": 3685,
"valid_targets_mean": 2445.9,
"valid_targets_min": 1142
},
{
"epoch": 5.980551053484603,
"grad_norm": 0.7106954338129656,
"learning_rate": 2.53716155818402e-06,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.336696982383728,
"step": 3690,
"valid_targets_mean": 3873.4,
"valid_targets_min": 1243
},
{
"epoch": 5.988654781199352,
"grad_norm": 0.58917163595744,
"learning_rate": 2.49790575281172e-06,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2684072256088257,
"step": 3695,
"valid_targets_mean": 5289.0,
"valid_targets_min": 1147
},
{
"epoch": 5.9967585089141,
"grad_norm": 0.6606555154321343,
"learning_rate": 2.4589357723655405e-06,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25777506828308105,
"step": 3700,
"valid_targets_mean": 4293.9,
"valid_targets_min": 1889
},
{
"epoch": 6.004862236628849,
"grad_norm": 0.7027728413429737,
"learning_rate": 2.4202522532602846e-06,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2268795222043991,
"step": 3705,
"valid_targets_mean": 3399.1,
"valid_targets_min": 1036
},
{
"epoch": 6.012965964343598,
"grad_norm": 0.8011004209420672,
"learning_rate": 2.381855827232571e-06,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30303099751472473,
"step": 3710,
"valid_targets_mean": 2753.8,
"valid_targets_min": 952
},
{
"epoch": 6.021069692058346,
"grad_norm": 0.7622833107404628,
"learning_rate": 2.343747121330544e-06,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26210296154022217,
"step": 3715,
"valid_targets_mean": 3469.6,
"valid_targets_min": 1178
},
{
"epoch": 6.0291734197730955,
"grad_norm": 0.7214806571727383,
"learning_rate": 2.3059267579036183e-06,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2521173655986786,
"step": 3720,
"valid_targets_mean": 3284.3,
"valid_targets_min": 998
},
{
"epoch": 6.037277147487845,
"grad_norm": 0.6902303351345986,
"learning_rate": 2.268395354592312e-06,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26502299308776855,
"step": 3725,
"valid_targets_mean": 4875.6,
"valid_targets_min": 1562
},
{
"epoch": 6.045380875202593,
"grad_norm": 0.7867477709532921,
"learning_rate": 2.2311535243181637e-06,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3001806139945984,
"step": 3730,
"valid_targets_mean": 3108.7,
"valid_targets_min": 1243
},
{
"epoch": 6.053484602917342,
"grad_norm": 0.8415320330661212,
"learning_rate": 2.1942018752737227e-06,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2877800464630127,
"step": 3735,
"valid_targets_mean": 2779.1,
"valid_targets_min": 1008
},
{
"epoch": 6.061588330632091,
"grad_norm": 0.8195152807284035,
"learning_rate": 2.1575410109126293e-06,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24368160963058472,
"step": 3740,
"valid_targets_mean": 2967.5,
"valid_targets_min": 1730
},
{
"epoch": 6.069692058346839,
"grad_norm": 0.6479699003172938,
"learning_rate": 2.121171529939734e-06,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2409634292125702,
"step": 3745,
"valid_targets_mean": 4277.7,
"valid_targets_min": 1205
},
{
"epoch": 6.077795786061588,
"grad_norm": 0.552108099887294,
"learning_rate": 2.085094026301349e-06,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2244204431772232,
"step": 3750,
"valid_targets_mean": 5570.9,
"valid_targets_min": 1132
},
{
"epoch": 6.085899513776337,
"grad_norm": 0.694523046518939,
"learning_rate": 2.0493090891755262e-06,
"loss": 0.2986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28496766090393066,
"step": 3755,
"valid_targets_mean": 4118.6,
"valid_targets_min": 934
},
{
"epoch": 6.094003241491086,
"grad_norm": 0.7428603071136939,
"learning_rate": 2.013817302962444e-06,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2954471707344055,
"step": 3760,
"valid_targets_mean": 4566.4,
"valid_targets_min": 1867
},
{
"epoch": 6.102106969205835,
"grad_norm": 0.6670308940945041,
"learning_rate": 1.9786192472748643e-06,
"loss": 0.3101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2413603663444519,
"step": 3765,
"valid_targets_mean": 3763.2,
"valid_targets_min": 1012
},
{
"epoch": 6.110210696920584,
"grad_norm": 0.6184485991768255,
"learning_rate": 1.9437154969286577e-06,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21730905771255493,
"step": 3770,
"valid_targets_mean": 4136.2,
"valid_targets_min": 1242
},
{
"epoch": 6.118314424635332,
"grad_norm": 0.8396579659658009,
"learning_rate": 1.9091066219334365e-06,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3086123466491699,
"step": 3775,
"valid_targets_mean": 3251.0,
"valid_targets_min": 1051
},
{
"epoch": 6.126418152350081,
"grad_norm": 0.7996562551138828,
"learning_rate": 1.8747931874832325e-06,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31810393929481506,
"step": 3780,
"valid_targets_mean": 3095.3,
"valid_targets_min": 887
},
{
"epoch": 6.13452188006483,
"grad_norm": 0.7835295163411242,
"learning_rate": 1.8407757539472548e-06,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26433265209198,
"step": 3785,
"valid_targets_mean": 2967.4,
"valid_targets_min": 1040
},
{
"epoch": 6.1426256077795784,
"grad_norm": 0.671422897302015,
"learning_rate": 1.8070548768607744e-06,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25956496596336365,
"step": 3790,
"valid_targets_mean": 4248.0,
"valid_targets_min": 1536
},
{
"epoch": 6.1507293354943275,
"grad_norm": 0.7640652471884006,
"learning_rate": 1.773631106915996e-06,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2866196632385254,
"step": 3795,
"valid_targets_mean": 3140.5,
"valid_targets_min": 865
},
{
"epoch": 6.158833063209076,
"grad_norm": 0.7901497100315298,
"learning_rate": 1.740504989953129e-06,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26567843556404114,
"step": 3800,
"valid_targets_mean": 2979.9,
"valid_targets_min": 886
},
{
"epoch": 6.166936790923825,
"grad_norm": 0.7775483944222201,
"learning_rate": 1.707677066951432e-06,
"loss": 0.258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2601214349269867,
"step": 3805,
"valid_targets_mean": 3538.1,
"valid_targets_min": 1217
},
{
"epoch": 6.175040518638574,
"grad_norm": 0.6915414702499607,
"learning_rate": 1.6751478740203776e-06,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2392570823431015,
"step": 3810,
"valid_targets_mean": 4333.6,
"valid_targets_min": 886
},
{
"epoch": 6.183144246353322,
"grad_norm": 0.7120258292651832,
"learning_rate": 1.6429179423909248e-06,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25904911756515503,
"step": 3815,
"valid_targets_mean": 4281.4,
"valid_targets_min": 1739
},
{
"epoch": 6.191247974068071,
"grad_norm": 0.6073873394357148,
"learning_rate": 1.6109877984068089e-06,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2905542850494385,
"step": 3820,
"valid_targets_mean": 5658.9,
"valid_targets_min": 1019
},
{
"epoch": 6.19935170178282,
"grad_norm": 0.6940476997510958,
"learning_rate": 1.5793579635159883e-06,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.291831910610199,
"step": 3825,
"valid_targets_mean": 4014.4,
"valid_targets_min": 1211
},
{
"epoch": 6.207455429497569,
"grad_norm": 0.6769492704139075,
"learning_rate": 1.5480289542620686e-06,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24061062932014465,
"step": 3830,
"valid_targets_mean": 4078.7,
"valid_targets_min": 868
},
{
"epoch": 6.215559157212318,
"grad_norm": 0.8350367658236924,
"learning_rate": 1.517001282275936e-06,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2500787377357483,
"step": 3835,
"valid_targets_mean": 3799.4,
"valid_targets_min": 1227
},
{
"epoch": 6.223662884927067,
"grad_norm": 0.651123871111124,
"learning_rate": 1.486275454267354e-06,
"loss": 0.269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3093678951263428,
"step": 3840,
"valid_targets_mean": 5790.4,
"valid_targets_min": 1183
},
{
"epoch": 6.231766612641815,
"grad_norm": 0.5701257680611536,
"learning_rate": 1.4558519720166975e-06,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2544712722301483,
"step": 3845,
"valid_targets_mean": 5241.6,
"valid_targets_min": 1120
},
{
"epoch": 6.239870340356564,
"grad_norm": 0.7056219502775309,
"learning_rate": 1.4257313323667798e-06,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31050872802734375,
"step": 3850,
"valid_targets_mean": 4014.6,
"valid_targets_min": 1203
},
{
"epoch": 6.247974068071313,
"grad_norm": 0.7262226243616173,
"learning_rate": 1.3959140272146998e-06,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27195703983306885,
"step": 3855,
"valid_targets_mean": 3768.8,
"valid_targets_min": 2037
},
{
"epoch": 6.256077795786061,
"grad_norm": 0.6357702807995875,
"learning_rate": 1.366400543503854e-06,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24853156507015228,
"step": 3860,
"valid_targets_mean": 4364.2,
"valid_targets_min": 969
},
{
"epoch": 6.2641815235008105,
"grad_norm": 0.766510336947776,
"learning_rate": 1.3371913632159506e-06,
"loss": 0.2846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2552717328071594,
"step": 3865,
"valid_targets_mean": 4211.0,
"valid_targets_min": 1164
},
{
"epoch": 6.272285251215559,
"grad_norm": 0.814344839562171,
"learning_rate": 1.3082869633631413e-06,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.299882709980011,
"step": 3870,
"valid_targets_mean": 2909.2,
"valid_targets_min": 1160
},
{
"epoch": 6.280388978930308,
"grad_norm": 0.7162700671892775,
"learning_rate": 1.2796878159802595e-06,
"loss": 0.2821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3379451632499695,
"step": 3875,
"valid_targets_mean": 4513.4,
"valid_targets_min": 1267
},
{
"epoch": 6.288492706645057,
"grad_norm": 0.7166231616916816,
"learning_rate": 1.2513943881170754e-06,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2593461871147156,
"step": 3880,
"valid_targets_mean": 3996.0,
"valid_targets_min": 1093
},
{
"epoch": 6.296596434359805,
"grad_norm": 0.7960125938291805,
"learning_rate": 1.2234071418306903e-06,
"loss": 0.2813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2560000419616699,
"step": 3885,
"valid_targets_mean": 2943.4,
"valid_targets_min": 1091
},
{
"epoch": 6.304700162074554,
"grad_norm": 0.7909822999764351,
"learning_rate": 1.1957265341779855e-06,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2831363379955292,
"step": 3890,
"valid_targets_mean": 2929.0,
"valid_targets_min": 1313
},
{
"epoch": 6.312803889789303,
"grad_norm": 0.8078944578627083,
"learning_rate": 1.1683530172081592e-06,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28948408365249634,
"step": 3895,
"valid_targets_mean": 3166.2,
"valid_targets_min": 826
},
{
"epoch": 6.3209076175040515,
"grad_norm": 0.6503889422727751,
"learning_rate": 1.1412870379553387e-06,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2851935029029846,
"step": 3900,
"valid_targets_mean": 5278.4,
"valid_targets_min": 1216
},
{
"epoch": 6.329011345218801,
"grad_norm": 0.7095808115759376,
"learning_rate": 1.1145290384312846e-06,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2966817617416382,
"step": 3905,
"valid_targets_mean": 3949.7,
"valid_targets_min": 344
},
{
"epoch": 6.33711507293355,
"grad_norm": 0.5713953001792478,
"learning_rate": 1.0880794556181762e-06,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26881951093673706,
"step": 3910,
"valid_targets_mean": 5394.6,
"valid_targets_min": 1396
},
{
"epoch": 6.345218800648298,
"grad_norm": 0.8057022743278727,
"learning_rate": 1.0619387214614662e-06,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28803229331970215,
"step": 3915,
"valid_targets_mean": 3252.2,
"valid_targets_min": 1268
},
{
"epoch": 6.353322528363047,
"grad_norm": 0.656199813723134,
"learning_rate": 1.0361072628628354e-06,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23762132227420807,
"step": 3920,
"valid_targets_mean": 4280.4,
"valid_targets_min": 813
},
{
"epoch": 6.361426256077796,
"grad_norm": 0.5444634341534144,
"learning_rate": 1.0105855016732113e-06,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2526979148387909,
"step": 3925,
"valid_targets_mean": 6552.8,
"valid_targets_min": 1364
},
{
"epoch": 6.369529983792544,
"grad_norm": 0.7191276204333831,
"learning_rate": 9.853738546858893e-07,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3756384253501892,
"step": 3930,
"valid_targets_mean": 4363.0,
"valid_targets_min": 628
},
{
"epoch": 6.377633711507293,
"grad_norm": 0.6072164246303409,
"learning_rate": 9.604727336297203e-07,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21978111565113068,
"step": 3935,
"valid_targets_mean": 4838.1,
"valid_targets_min": 1210
},
{
"epoch": 6.3857374392220425,
"grad_norm": 0.8535219826727345,
"learning_rate": 9.358825451623832e-07,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3109622001647949,
"step": 3940,
"valid_targets_mean": 2759.0,
"valid_targets_min": 1075
},
{
"epoch": 6.393841166936791,
"grad_norm": 0.8018109420542197,
"learning_rate": 9.116036908637582e-07,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27665650844573975,
"step": 3945,
"valid_targets_mean": 3128.8,
"valid_targets_min": 1066
},
{
"epoch": 6.40194489465154,
"grad_norm": 0.6118808079483848,
"learning_rate": 8.876365672293441e-07,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24101707339286804,
"step": 3950,
"valid_targets_mean": 5033.9,
"valid_targets_min": 1184
},
{
"epoch": 6.410048622366288,
"grad_norm": 0.6738977504802829,
"learning_rate": 8.639815656638162e-07,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23450031876564026,
"step": 3955,
"valid_targets_mean": 4632.9,
"valid_targets_min": 1016
},
{
"epoch": 6.418152350081037,
"grad_norm": 0.6578666448021531,
"learning_rate": 8.406390724745961e-07,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25716516375541687,
"step": 3960,
"valid_targets_mean": 4409.2,
"valid_targets_min": 1423
},
{
"epoch": 6.426256077795786,
"grad_norm": 0.7504549153226855,
"learning_rate": 8.176094688655789e-07,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24591027200222015,
"step": 3965,
"valid_targets_mean": 3898.1,
"valid_targets_min": 1247
},
{
"epoch": 6.434359805510534,
"grad_norm": 0.716758853434586,
"learning_rate": 7.948931309308872e-07,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2400793880224228,
"step": 3970,
"valid_targets_mean": 3711.0,
"valid_targets_min": 815
},
{
"epoch": 6.4424635332252835,
"grad_norm": 0.6187434162303004,
"learning_rate": 7.724904296487246e-07,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.240831196308136,
"step": 3975,
"valid_targets_mean": 4534.2,
"valid_targets_min": 1314
},
{
"epoch": 6.450567260940033,
"grad_norm": 0.7413645604300104,
"learning_rate": 7.504017308753386e-07,
"loss": 0.2605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26031699776649475,
"step": 3980,
"valid_targets_mean": 3497.0,
"valid_targets_min": 985
},
{
"epoch": 6.458670988654781,
"grad_norm": 0.6834988461746635,
"learning_rate": 7.286273953390278e-07,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3183531165122986,
"step": 3985,
"valid_targets_mean": 4240.6,
"valid_targets_min": 895
},
{
"epoch": 6.46677471636953,
"grad_norm": 0.7125067985322497,
"learning_rate": 7.071677786342568e-07,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23387478291988373,
"step": 3990,
"valid_targets_mean": 4085.0,
"valid_targets_min": 1346
},
{
"epoch": 6.474878444084279,
"grad_norm": 0.5676104505322674,
"learning_rate": 6.860232312158554e-07,
"loss": 0.2599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.215545192360878,
"step": 3995,
"valid_targets_mean": 5310.1,
"valid_targets_min": 1485
},
{
"epoch": 6.482982171799027,
"grad_norm": 0.8287830712031203,
"learning_rate": 6.651940983932737e-07,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28875142335891724,
"step": 4000,
"valid_targets_mean": 2980.1,
"valid_targets_min": 1046
},
{
"epoch": 6.491085899513776,
"grad_norm": 0.567888858150834,
"learning_rate": 6.44680720324975e-07,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2143402099609375,
"step": 4005,
"valid_targets_mean": 4987.5,
"valid_targets_min": 1468
},
{
"epoch": 6.4991896272285254,
"grad_norm": 0.8657516748787141,
"learning_rate": 6.244834320128501e-07,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2904426157474518,
"step": 4010,
"valid_targets_mean": 2812.2,
"valid_targets_min": 1016
},
{
"epoch": 6.507293354943274,
"grad_norm": 0.6802979979107128,
"learning_rate": 6.0460256329677e-07,
"loss": 0.2451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2284238040447235,
"step": 4015,
"valid_targets_mean": 3829.1,
"valid_targets_min": 999
},
{
"epoch": 6.515397082658023,
"grad_norm": 0.6616469553258651,
"learning_rate": 5.850384388491814e-07,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26627442240715027,
"step": 4020,
"valid_targets_mean": 4338.4,
"valid_targets_min": 1301
},
{
"epoch": 6.523500810372772,
"grad_norm": 0.7578702676971412,
"learning_rate": 5.657913781698221e-07,
"loss": 0.2784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26661694049835205,
"step": 4025,
"valid_targets_mean": 3835.7,
"valid_targets_min": 1097
},
{
"epoch": 6.53160453808752,
"grad_norm": 0.8009653624376153,
"learning_rate": 5.468616955804873e-07,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3027913570404053,
"step": 4030,
"valid_targets_mean": 3376.9,
"valid_targets_min": 1041
},
{
"epoch": 6.539708265802269,
"grad_norm": 0.7130215275679384,
"learning_rate": 5.282497002198983e-07,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25583645701408386,
"step": 4035,
"valid_targets_mean": 3905.9,
"valid_targets_min": 1207
},
{
"epoch": 6.547811993517017,
"grad_norm": 0.7385392471080525,
"learning_rate": 5.099556960386686e-07,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25842177867889404,
"step": 4040,
"valid_targets_mean": 3477.1,
"valid_targets_min": 1364
},
{
"epoch": 6.5559157212317665,
"grad_norm": 0.974897501639828,
"learning_rate": 4.919799817943238e-07,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3050478398799896,
"step": 4045,
"valid_targets_mean": 2837.5,
"valid_targets_min": 1061
},
{
"epoch": 6.564019448946516,
"grad_norm": 0.6798897469940042,
"learning_rate": 4.7432285104642703e-07,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23295563459396362,
"step": 4050,
"valid_targets_mean": 4162.9,
"valid_targets_min": 1044
},
{
"epoch": 6.572123176661265,
"grad_norm": 0.7307056993453411,
"learning_rate": 4.569845921517968e-07,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25635001063346863,
"step": 4055,
"valid_targets_mean": 3471.1,
"valid_targets_min": 1188
},
{
"epoch": 6.580226904376013,
"grad_norm": 0.6997105951135152,
"learning_rate": 4.399654882597726e-07,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3000991642475128,
"step": 4060,
"valid_targets_mean": 4791.9,
"valid_targets_min": 1107
},
{
"epoch": 6.588330632090762,
"grad_norm": 0.7720123442423956,
"learning_rate": 4.232658173076232e-07,
"loss": 0.2587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2398601472377777,
"step": 4065,
"valid_targets_mean": 3633.2,
"valid_targets_min": 971
},
{
"epoch": 6.59643435980551,
"grad_norm": 0.667849292616193,
"learning_rate": 4.068858520159724e-07,
"loss": 0.2706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535744905471802,
"step": 4070,
"valid_targets_mean": 4069.8,
"valid_targets_min": 1143
},
{
"epoch": 6.604538087520259,
"grad_norm": 0.5638956199207986,
"learning_rate": 3.9082585988437617e-07,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24108228087425232,
"step": 4075,
"valid_targets_mean": 5918.1,
"valid_targets_min": 1143
},
{
"epoch": 6.612641815235008,
"grad_norm": 0.6112457385056609,
"learning_rate": 3.7508610318693684e-07,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21963872015476227,
"step": 4080,
"valid_targets_mean": 4737.4,
"valid_targets_min": 1405
},
{
"epoch": 6.620745542949757,
"grad_norm": 1.0780947655547286,
"learning_rate": 3.596668389680247e-07,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27150118350982666,
"step": 4085,
"valid_targets_mean": 3611.4,
"valid_targets_min": 1160
},
{
"epoch": 6.628849270664506,
"grad_norm": 0.6071034680621801,
"learning_rate": 3.445683190380833e-07,
"loss": 0.2813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29520419239997864,
"step": 4090,
"valid_targets_mean": 6065.9,
"valid_targets_min": 1438
},
{
"epoch": 6.636952998379255,
"grad_norm": 0.6734164739619142,
"learning_rate": 3.297907899695019e-07,
"loss": 0.2672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27870097756385803,
"step": 4095,
"valid_targets_mean": 3903.8,
"valid_targets_min": 1070
},
{
"epoch": 6.645056726094003,
"grad_norm": 0.840649714564737,
"learning_rate": 3.1533449309262056e-07,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2556115686893463,
"step": 4100,
"valid_targets_mean": 3202.4,
"valid_targets_min": 733
},
{
"epoch": 6.653160453808752,
"grad_norm": 0.8751889443011073,
"learning_rate": 3.0119966449174474e-07,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3118496537208557,
"step": 4105,
"valid_targets_mean": 4041.4,
"valid_targets_min": 1145
},
{
"epoch": 6.661264181523501,
"grad_norm": 0.7587472130380253,
"learning_rate": 2.8738653500133494e-07,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2707531452178955,
"step": 4110,
"valid_targets_mean": 4125.2,
"valid_targets_min": 1152
},
{
"epoch": 6.669367909238249,
"grad_norm": 0.8004779128159383,
"learning_rate": 2.738953302022096e-07,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31876587867736816,
"step": 4115,
"valid_targets_mean": 3345.1,
"valid_targets_min": 1158
},
{
"epoch": 6.6774716369529985,
"grad_norm": 0.6332081406992072,
"learning_rate": 2.6072627041785925e-07,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23436513543128967,
"step": 4120,
"valid_targets_mean": 4620.5,
"valid_targets_min": 1546
},
{
"epoch": 6.685575364667747,
"grad_norm": 0.5678494967037826,
"learning_rate": 2.478795707108672e-07,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23043310642242432,
"step": 4125,
"valid_targets_mean": 4959.5,
"valid_targets_min": 1162
},
{
"epoch": 6.693679092382496,
"grad_norm": 0.630783160958136,
"learning_rate": 2.3535544087938345e-07,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2515913248062134,
"step": 4130,
"valid_targets_mean": 4601.9,
"valid_targets_min": 1579
},
{
"epoch": 6.701782820097245,
"grad_norm": 1.0053058271111657,
"learning_rate": 2.2315408545370288e-07,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27254045009613037,
"step": 4135,
"valid_targets_mean": 2783.1,
"valid_targets_min": 1009
},
{
"epoch": 6.709886547811994,
"grad_norm": 0.6409152830997872,
"learning_rate": 2.1127570369292361e-07,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27788475155830383,
"step": 4140,
"valid_targets_mean": 5011.4,
"valid_targets_min": 1106
},
{
"epoch": 6.717990275526742,
"grad_norm": 0.6392402407017796,
"learning_rate": 1.9972048958168954e-07,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23322021961212158,
"step": 4145,
"valid_targets_mean": 4512.9,
"valid_targets_min": 1069
},
{
"epoch": 6.726094003241491,
"grad_norm": 0.6358548166174536,
"learning_rate": 1.8848863182703513e-07,
"loss": 0.2599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605475187301636,
"step": 4150,
"valid_targets_mean": 3927.9,
"valid_targets_min": 1140
},
{
"epoch": 6.7341977309562395,
"grad_norm": 0.671040397851917,
"learning_rate": 1.7758031385528784e-07,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39784008264541626,
"step": 4155,
"valid_targets_mean": 4703.1,
"valid_targets_min": 1170
},
{
"epoch": 6.742301458670989,
"grad_norm": 0.7726852582259216,
"learning_rate": 1.6699571380908385e-07,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32319122552871704,
"step": 4160,
"valid_targets_mean": 3434.7,
"valid_targets_min": 710
},
{
"epoch": 6.750405186385738,
"grad_norm": 0.7122432763736924,
"learning_rate": 1.5673500454445046e-07,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2571845054626465,
"step": 4165,
"valid_targets_mean": 3780.6,
"valid_targets_min": 1323
},
{
"epoch": 6.758508914100486,
"grad_norm": 0.7328015093005262,
"learning_rate": 1.4679835362799266e-07,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29261136054992676,
"step": 4170,
"valid_targets_mean": 4295.0,
"valid_targets_min": 463
},
{
"epoch": 6.766612641815235,
"grad_norm": 0.6595980272648833,
"learning_rate": 1.3718592333414881e-07,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2447427660226822,
"step": 4175,
"valid_targets_mean": 4700.2,
"valid_targets_min": 1429
},
{
"epoch": 6.774716369529984,
"grad_norm": 0.74623136258456,
"learning_rate": 1.2789787064253934e-07,
"loss": 0.2982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32457369565963745,
"step": 4180,
"valid_targets_mean": 4794.1,
"valid_targets_min": 361
},
{
"epoch": 6.782820097244732,
"grad_norm": 0.6387805597272295,
"learning_rate": 1.1893434723541542e-07,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.247330904006958,
"step": 4185,
"valid_targets_mean": 5098.8,
"valid_targets_min": 1586
},
{
"epoch": 6.790923824959481,
"grad_norm": 0.7914446560492252,
"learning_rate": 1.1029549949516549e-07,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25566303730010986,
"step": 4190,
"valid_targets_mean": 2928.6,
"valid_targets_min": 1435
},
{
"epoch": 6.7990275526742305,
"grad_norm": 0.6784435117492335,
"learning_rate": 1.0198146850193935e-07,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23428568243980408,
"step": 4195,
"valid_targets_mean": 4123.6,
"valid_targets_min": 1070
},
{
"epoch": 6.807131280388979,
"grad_norm": 0.9219689586760358,
"learning_rate": 9.399239003132999e-08,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27654707431793213,
"step": 4200,
"valid_targets_mean": 2339.8,
"valid_targets_min": 347
},
{
"epoch": 6.815235008103728,
"grad_norm": 0.9992054972300621,
"learning_rate": 8.632839455216869e-08,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3159137964248657,
"step": 4205,
"valid_targets_mean": 2398.5,
"valid_targets_min": 1235
},
{
"epoch": 6.823338735818476,
"grad_norm": 0.7850895651410487,
"learning_rate": 7.89896072243912e-08,
"loss": 0.2533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29079508781433105,
"step": 4210,
"valid_targets_mean": 3143.6,
"valid_targets_min": 1413
},
{
"epoch": 6.831442463533225,
"grad_norm": 1.0537086856892872,
"learning_rate": 7.197614789698604e-08,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2822344899177551,
"step": 4215,
"valid_targets_mean": 3394.4,
"valid_targets_min": 983
},
{
"epoch": 6.839546191247974,
"grad_norm": 0.8211601548625681,
"learning_rate": 6.528813110604714e-08,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31433653831481934,
"step": 4220,
"valid_targets_mean": 2904.8,
"valid_targets_min": 1244
},
{
"epoch": 6.847649918962723,
"grad_norm": 0.8759060227159305,
"learning_rate": 5.8925666072899845e-08,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29553893208503723,
"step": 4225,
"valid_targets_mean": 3257.2,
"valid_targets_min": 1018
},
{
"epoch": 6.855753646677472,
"grad_norm": 0.8027670263828199,
"learning_rate": 5.288885670231336e-08,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29728516936302185,
"step": 4230,
"valid_targets_mean": 3178.8,
"valid_targets_min": 1256
},
{
"epoch": 6.863857374392221,
"grad_norm": 0.6309128871254511,
"learning_rate": 4.717780158080887e-08,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22423002123832703,
"step": 4235,
"valid_targets_mean": 4645.9,
"valid_targets_min": 1714
},
{
"epoch": 6.871961102106969,
"grad_norm": 0.7061556050034734,
"learning_rate": 4.1792593975049644e-08,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23919057846069336,
"step": 4240,
"valid_targets_mean": 3472.2,
"valid_targets_min": 1101
},
{
"epoch": 6.880064829821718,
"grad_norm": 0.7475024848941403,
"learning_rate": 3.6733321830315636e-08,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3009330630302429,
"step": 4245,
"valid_targets_mean": 3434.6,
"valid_targets_min": 972
},
{
"epoch": 6.888168557536467,
"grad_norm": 0.5604792404146883,
"learning_rate": 3.200006776906461e-08,
"loss": 0.3085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2671416103839874,
"step": 4250,
"valid_targets_mean": 5724.2,
"valid_targets_min": 2505
},
{
"epoch": 6.896272285251215,
"grad_norm": 0.6499933621677116,
"learning_rate": 2.7592909089593224e-08,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2697727382183075,
"step": 4255,
"valid_targets_mean": 4409.6,
"valid_targets_min": 1403
},
{
"epoch": 6.904376012965964,
"grad_norm": 0.7422334882426721,
"learning_rate": 2.351191776475581e-08,
"loss": 0.2574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24201233685016632,
"step": 4260,
"valid_targets_mean": 3177.5,
"valid_targets_min": 1107
},
{
"epoch": 6.9124797406807135,
"grad_norm": 0.6139803295015263,
"learning_rate": 1.9757160440814217e-08,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2602802515029907,
"step": 4265,
"valid_targets_mean": 4547.1,
"valid_targets_min": 1339
},
{
"epoch": 6.920583468395462,
"grad_norm": 0.8330992402016216,
"learning_rate": 1.6328698436327562e-08,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27471017837524414,
"step": 4270,
"valid_targets_mean": 2963.1,
"valid_targets_min": 1058
},
{
"epoch": 6.928687196110211,
"grad_norm": 0.7303505672027717,
"learning_rate": 1.3226587741159702e-08,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26886293292045593,
"step": 4275,
"valid_targets_mean": 3608.6,
"valid_targets_min": 1171
},
{
"epoch": 6.93679092382496,
"grad_norm": 0.747537768686201,
"learning_rate": 1.0450879015566629e-08,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23849567770957947,
"step": 4280,
"valid_targets_mean": 2990.4,
"valid_targets_min": 1084
},
{
"epoch": 6.944894651539708,
"grad_norm": 0.7691581570436978,
"learning_rate": 8.001617589368238e-09,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27607500553131104,
"step": 4285,
"valid_targets_mean": 3319.6,
"valid_targets_min": 1448
},
{
"epoch": 6.952998379254457,
"grad_norm": 0.7777486056188054,
"learning_rate": 5.878843461200046e-09,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2839847207069397,
"step": 4290,
"valid_targets_mean": 3421.1,
"valid_targets_min": 989
},
{
"epoch": 6.961102106969205,
"grad_norm": 0.7537030177576087,
"learning_rate": 4.082591297873695e-09,
"loss": 0.2767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192595839500427,
"step": 4295,
"valid_targets_mean": 3606.9,
"valid_targets_min": 1058
},
{
"epoch": 6.9692058346839545,
"grad_norm": 0.6782862771300621,
"learning_rate": 2.6128904338018624e-09,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3403030037879944,
"step": 4300,
"valid_targets_mean": 4660.7,
"valid_targets_min": 845
},
{
"epoch": 6.977309562398704,
"grad_norm": 0.6131020501214138,
"learning_rate": 1.4697648705186417e-09,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20277269184589386,
"step": 4305,
"valid_targets_mean": 4003.3,
"valid_targets_min": 1271
},
{
"epoch": 6.985413290113452,
"grad_norm": 0.71749765762531,
"learning_rate": 6.532332762931859e-10,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2628193795681,
"step": 4310,
"valid_targets_mean": 3631.9,
"valid_targets_min": 1335
},
{
"epoch": 6.993517017828201,
"grad_norm": 0.7515541884292178,
"learning_rate": 1.6330898581884414e-10,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3376891016960144,
"step": 4315,
"valid_targets_mean": 3517.7,
"valid_targets_min": 1401
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23076336085796356,
"step": 4319,
"total_flos": 1056573424926720.0,
"train_loss": 0.349568347366189,
"train_runtime": 28403.7175,
"train_samples_per_second": 2.431,
"train_steps_per_second": 0.152,
"valid_targets_mean": 5247.5,
"valid_targets_min": 1276
}
],
"logging_steps": 5,
"max_steps": 4319,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1056573424926720.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}