Files
a1-stackexchange_tor/trainer_state.json
ModelHub XC 4e63e88f3e 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/a1-stackexchange_tor
Source: Original Platform
2026-05-11 12:32:16 +08:00

9761 lines
270 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4417,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.00792393026941363,
"grad_norm": 18.30795544148065,
"learning_rate": 3.619909502262444e-07,
"loss": 0.9909,
"loss_nan_ranks": 0,
"loss_rank_avg": 1.0027930736541748,
"step": 5,
"valid_targets_mean": 3096.8,
"valid_targets_min": 1275
},
{
"epoch": 0.01584786053882726,
"grad_norm": 17.799072817552403,
"learning_rate": 8.144796380090498e-07,
"loss": 0.9684,
"loss_nan_ranks": 0,
"loss_rank_avg": 1.0059874057769775,
"step": 10,
"valid_targets_mean": 2921.6,
"valid_targets_min": 959
},
{
"epoch": 0.02377179080824089,
"grad_norm": 18.446857759452225,
"learning_rate": 1.2669683257918552e-06,
"loss": 0.928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.9721807241439819,
"step": 15,
"valid_targets_mean": 3334.1,
"valid_targets_min": 1196
},
{
"epoch": 0.03169572107765452,
"grad_norm": 13.528514126701259,
"learning_rate": 1.7194570135746609e-06,
"loss": 0.9344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8746083974838257,
"step": 20,
"valid_targets_mean": 3560.9,
"valid_targets_min": 1101
},
{
"epoch": 0.039619651347068144,
"grad_norm": 9.31391677104,
"learning_rate": 2.171945701357466e-06,
"loss": 0.896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8563970327377319,
"step": 25,
"valid_targets_mean": 3255.4,
"valid_targets_min": 1420
},
{
"epoch": 0.04754358161648178,
"grad_norm": 5.740949384443614,
"learning_rate": 2.624434389140272e-06,
"loss": 0.8017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7667723894119263,
"step": 30,
"valid_targets_mean": 3685.8,
"valid_targets_min": 1106
},
{
"epoch": 0.0554675118858954,
"grad_norm": 2.8043645950548908,
"learning_rate": 3.0769230769230774e-06,
"loss": 0.7712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6531684994697571,
"step": 35,
"valid_targets_mean": 4291.8,
"valid_targets_min": 1303
},
{
"epoch": 0.06339144215530904,
"grad_norm": 2.1470577969090754,
"learning_rate": 3.529411764705883e-06,
"loss": 0.7427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7266800403594971,
"step": 40,
"valid_targets_mean": 2956.1,
"valid_targets_min": 999
},
{
"epoch": 0.07131537242472266,
"grad_norm": 1.8591952619735816,
"learning_rate": 3.9819004524886875e-06,
"loss": 0.7016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7177771329879761,
"step": 45,
"valid_targets_mean": 2703.8,
"valid_targets_min": 1178
},
{
"epoch": 0.07923930269413629,
"grad_norm": 1.5113516568275136,
"learning_rate": 4.434389140271493e-06,
"loss": 0.697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7023115158081055,
"step": 50,
"valid_targets_mean": 2789.7,
"valid_targets_min": 1292
},
{
"epoch": 0.08716323296354993,
"grad_norm": 1.0994842020421405,
"learning_rate": 4.886877828054299e-06,
"loss": 0.6765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6585033535957336,
"step": 55,
"valid_targets_mean": 3465.1,
"valid_targets_min": 1032
},
{
"epoch": 0.09508716323296355,
"grad_norm": 1.9537311330380602,
"learning_rate": 5.339366515837105e-06,
"loss": 0.6928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7655017375946045,
"step": 60,
"valid_targets_mean": 2952.2,
"valid_targets_min": 932
},
{
"epoch": 0.10301109350237718,
"grad_norm": 0.9347844302177003,
"learning_rate": 5.79185520361991e-06,
"loss": 0.6466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6798193454742432,
"step": 65,
"valid_targets_mean": 3296.2,
"valid_targets_min": 558
},
{
"epoch": 0.1109350237717908,
"grad_norm": 0.820064187537382,
"learning_rate": 6.244343891402716e-06,
"loss": 0.6493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6339085102081299,
"step": 70,
"valid_targets_mean": 3473.1,
"valid_targets_min": 974
},
{
"epoch": 0.11885895404120443,
"grad_norm": 0.84149786444046,
"learning_rate": 6.69683257918552e-06,
"loss": 0.6203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5971336960792542,
"step": 75,
"valid_targets_mean": 3043.6,
"valid_targets_min": 1040
},
{
"epoch": 0.12678288431061807,
"grad_norm": 0.819875440430727,
"learning_rate": 7.1493212669683265e-06,
"loss": 0.6207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5473138093948364,
"step": 80,
"valid_targets_mean": 3087.9,
"valid_targets_min": 1250
},
{
"epoch": 0.1347068145800317,
"grad_norm": 0.937345203637578,
"learning_rate": 7.601809954751131e-06,
"loss": 0.6579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7002801895141602,
"step": 85,
"valid_targets_mean": 2635.6,
"valid_targets_min": 574
},
{
"epoch": 0.14263074484944532,
"grad_norm": 0.9146174502773798,
"learning_rate": 8.054298642533938e-06,
"loss": 0.62,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6000384092330933,
"step": 90,
"valid_targets_mean": 2494.1,
"valid_targets_min": 737
},
{
"epoch": 0.15055467511885895,
"grad_norm": 0.9169686189770018,
"learning_rate": 8.506787330316743e-06,
"loss": 0.6039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6068024039268494,
"step": 95,
"valid_targets_mean": 2555.5,
"valid_targets_min": 1085
},
{
"epoch": 0.15847860538827258,
"grad_norm": 0.9320852712314595,
"learning_rate": 8.95927601809955e-06,
"loss": 0.6062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.614492654800415,
"step": 100,
"valid_targets_mean": 2322.4,
"valid_targets_min": 923
},
{
"epoch": 0.1664025356576862,
"grad_norm": 0.7979632405521523,
"learning_rate": 9.411764705882354e-06,
"loss": 0.5937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.562329888343811,
"step": 105,
"valid_targets_mean": 3538.2,
"valid_targets_min": 511
},
{
"epoch": 0.17432646592709986,
"grad_norm": 0.7797014261938441,
"learning_rate": 9.86425339366516e-06,
"loss": 0.5676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5618658065795898,
"step": 110,
"valid_targets_mean": 3149.2,
"valid_targets_min": 813
},
{
"epoch": 0.18225039619651348,
"grad_norm": 0.7701673082038006,
"learning_rate": 1.0316742081447966e-05,
"loss": 0.5769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.561303436756134,
"step": 115,
"valid_targets_mean": 2988.9,
"valid_targets_min": 1007
},
{
"epoch": 0.1901743264659271,
"grad_norm": 0.7301022610624124,
"learning_rate": 1.076923076923077e-05,
"loss": 0.585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5721402764320374,
"step": 120,
"valid_targets_mean": 3576.1,
"valid_targets_min": 1733
},
{
"epoch": 0.19809825673534073,
"grad_norm": 0.8464639593444047,
"learning_rate": 1.1221719457013576e-05,
"loss": 0.5752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6512378454208374,
"step": 125,
"valid_targets_mean": 3244.2,
"valid_targets_min": 1307
},
{
"epoch": 0.20602218700475436,
"grad_norm": 0.7861472935507103,
"learning_rate": 1.1674208144796382e-05,
"loss": 0.5427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5997300148010254,
"step": 130,
"valid_targets_mean": 3249.4,
"valid_targets_min": 1552
},
{
"epoch": 0.21394611727416799,
"grad_norm": 0.6975163539631399,
"learning_rate": 1.2126696832579185e-05,
"loss": 0.5473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5397928953170776,
"step": 135,
"valid_targets_mean": 3848.9,
"valid_targets_min": 613
},
{
"epoch": 0.2218700475435816,
"grad_norm": 0.8396368977750472,
"learning_rate": 1.2579185520361991e-05,
"loss": 0.5497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5377547740936279,
"step": 140,
"valid_targets_mean": 2616.2,
"valid_targets_min": 1135
},
{
"epoch": 0.22979397781299524,
"grad_norm": 0.734689091691239,
"learning_rate": 1.3031674208144797e-05,
"loss": 0.5247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5179744958877563,
"step": 145,
"valid_targets_mean": 3031.5,
"valid_targets_min": 806
},
{
"epoch": 0.23771790808240886,
"grad_norm": 0.810545526512668,
"learning_rate": 1.3484162895927604e-05,
"loss": 0.5628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5749671459197998,
"step": 150,
"valid_targets_mean": 2848.2,
"valid_targets_min": 1117
},
{
"epoch": 0.24564183835182252,
"grad_norm": 0.7252435536596383,
"learning_rate": 1.3936651583710408e-05,
"loss": 0.5325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4927237033843994,
"step": 155,
"valid_targets_mean": 3464.4,
"valid_targets_min": 804
},
{
"epoch": 0.25356576862123614,
"grad_norm": 0.7835612232571453,
"learning_rate": 1.4389140271493213e-05,
"loss": 0.5614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5875840783119202,
"step": 160,
"valid_targets_mean": 3134.0,
"valid_targets_min": 1040
},
{
"epoch": 0.26148969889064977,
"grad_norm": 0.8037709330769847,
"learning_rate": 1.484162895927602e-05,
"loss": 0.555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5322756171226501,
"step": 165,
"valid_targets_mean": 2802.3,
"valid_targets_min": 1217
},
{
"epoch": 0.2694136291600634,
"grad_norm": 0.8508977275858737,
"learning_rate": 1.5294117647058822e-05,
"loss": 0.55,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5077811479568481,
"step": 170,
"valid_targets_mean": 3118.4,
"valid_targets_min": 643
},
{
"epoch": 0.277337559429477,
"grad_norm": 0.7172097062555428,
"learning_rate": 1.574660633484163e-05,
"loss": 0.5179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48911088705062866,
"step": 175,
"valid_targets_mean": 3719.6,
"valid_targets_min": 1500
},
{
"epoch": 0.28526148969889065,
"grad_norm": 0.753428022374828,
"learning_rate": 1.6199095022624435e-05,
"loss": 0.4977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5100698471069336,
"step": 180,
"valid_targets_mean": 3200.1,
"valid_targets_min": 795
},
{
"epoch": 0.2931854199683043,
"grad_norm": 0.7186918449674007,
"learning_rate": 1.6651583710407243e-05,
"loss": 0.5391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5387634038925171,
"step": 185,
"valid_targets_mean": 3925.0,
"valid_targets_min": 1582
},
{
"epoch": 0.3011093502377179,
"grad_norm": 0.8467273342860667,
"learning_rate": 1.7104072398190047e-05,
"loss": 0.5302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5354914665222168,
"step": 190,
"valid_targets_mean": 2833.6,
"valid_targets_min": 976
},
{
"epoch": 0.3090332805071315,
"grad_norm": 0.8821480809910013,
"learning_rate": 1.7556561085972852e-05,
"loss": 0.5174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5056538581848145,
"step": 195,
"valid_targets_mean": 2422.6,
"valid_targets_min": 1091
},
{
"epoch": 0.31695721077654515,
"grad_norm": 0.7440887923285217,
"learning_rate": 1.8009049773755657e-05,
"loss": 0.5504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5461665391921997,
"step": 200,
"valid_targets_mean": 3475.5,
"valid_targets_min": 953
},
{
"epoch": 0.3248811410459588,
"grad_norm": 0.8495808389526411,
"learning_rate": 1.8461538461538465e-05,
"loss": 0.5109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4988098740577698,
"step": 205,
"valid_targets_mean": 2842.1,
"valid_targets_min": 948
},
{
"epoch": 0.3328050713153724,
"grad_norm": 0.8073270397360635,
"learning_rate": 1.891402714932127e-05,
"loss": 0.5039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5106959342956543,
"step": 210,
"valid_targets_mean": 3173.0,
"valid_targets_min": 1091
},
{
"epoch": 0.34072900158478603,
"grad_norm": 0.8240792568108604,
"learning_rate": 1.9366515837104074e-05,
"loss": 0.504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5431502461433411,
"step": 215,
"valid_targets_mean": 2898.2,
"valid_targets_min": 605
},
{
"epoch": 0.3486529318541997,
"grad_norm": 0.8295014877374133,
"learning_rate": 1.981900452488688e-05,
"loss": 0.5304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5582056045532227,
"step": 220,
"valid_targets_mean": 2875.2,
"valid_targets_min": 1271
},
{
"epoch": 0.35657686212361334,
"grad_norm": 2.271995482651572,
"learning_rate": 2.0271493212669683e-05,
"loss": 0.5235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.538544774055481,
"step": 225,
"valid_targets_mean": 2641.7,
"valid_targets_min": 959
},
{
"epoch": 0.36450079239302696,
"grad_norm": 0.8237389594967636,
"learning_rate": 2.072398190045249e-05,
"loss": 0.5407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5350701808929443,
"step": 230,
"valid_targets_mean": 3219.0,
"valid_targets_min": 1486
},
{
"epoch": 0.3724247226624406,
"grad_norm": 0.7959671331295798,
"learning_rate": 2.1176470588235296e-05,
"loss": 0.5032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5149205923080444,
"step": 235,
"valid_targets_mean": 2917.6,
"valid_targets_min": 1040
},
{
"epoch": 0.3803486529318542,
"grad_norm": 0.7671263696227919,
"learning_rate": 2.16289592760181e-05,
"loss": 0.5213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.541510283946991,
"step": 240,
"valid_targets_mean": 3337.9,
"valid_targets_min": 1126
},
{
"epoch": 0.38827258320126784,
"grad_norm": 0.8241086669277788,
"learning_rate": 2.2081447963800908e-05,
"loss": 0.5073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49820655584335327,
"step": 245,
"valid_targets_mean": 3259.1,
"valid_targets_min": 1129
},
{
"epoch": 0.39619651347068147,
"grad_norm": 0.8184305981195854,
"learning_rate": 2.2533936651583713e-05,
"loss": 0.5124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5349119901657104,
"step": 250,
"valid_targets_mean": 3188.1,
"valid_targets_min": 1113
},
{
"epoch": 0.4041204437400951,
"grad_norm": 0.7932024628401,
"learning_rate": 2.2986425339366517e-05,
"loss": 0.4913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5034860372543335,
"step": 255,
"valid_targets_mean": 2739.3,
"valid_targets_min": 1349
},
{
"epoch": 0.4120443740095087,
"grad_norm": 0.7551847650496477,
"learning_rate": 2.3438914027149325e-05,
"loss": 0.5018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4922025203704834,
"step": 260,
"valid_targets_mean": 3856.2,
"valid_targets_min": 1112
},
{
"epoch": 0.41996830427892234,
"grad_norm": 0.8505689875054292,
"learning_rate": 2.3891402714932127e-05,
"loss": 0.4818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48634108901023865,
"step": 265,
"valid_targets_mean": 3152.6,
"valid_targets_min": 984
},
{
"epoch": 0.42789223454833597,
"grad_norm": 0.772976426564909,
"learning_rate": 2.434389140271493e-05,
"loss": 0.4938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5387519001960754,
"step": 270,
"valid_targets_mean": 3622.1,
"valid_targets_min": 987
},
{
"epoch": 0.4358161648177496,
"grad_norm": 0.728717890666478,
"learning_rate": 2.479638009049774e-05,
"loss": 0.4837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4416227638721466,
"step": 275,
"valid_targets_mean": 3568.1,
"valid_targets_min": 870
},
{
"epoch": 0.4437400950871632,
"grad_norm": 0.7440381524213614,
"learning_rate": 2.5248868778280544e-05,
"loss": 0.4725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4643154740333557,
"step": 280,
"valid_targets_mean": 3414.1,
"valid_targets_min": 1170
},
{
"epoch": 0.45166402535657685,
"grad_norm": 0.8310009993608024,
"learning_rate": 2.5701357466063352e-05,
"loss": 0.508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5839574933052063,
"step": 285,
"valid_targets_mean": 3222.6,
"valid_targets_min": 1309
},
{
"epoch": 0.4595879556259905,
"grad_norm": 1.0056080573653239,
"learning_rate": 2.6153846153846157e-05,
"loss": 0.503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5559020042419434,
"step": 290,
"valid_targets_mean": 2088.1,
"valid_targets_min": 904
},
{
"epoch": 0.4675118858954041,
"grad_norm": 0.7408460822295689,
"learning_rate": 2.660633484162896e-05,
"loss": 0.4563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.485029399394989,
"step": 295,
"valid_targets_mean": 3781.1,
"valid_targets_min": 1262
},
{
"epoch": 0.4754358161648177,
"grad_norm": 0.8762884446062088,
"learning_rate": 2.705882352941177e-05,
"loss": 0.4595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4712425470352173,
"step": 300,
"valid_targets_mean": 2533.3,
"valid_targets_min": 1219
},
{
"epoch": 0.48335974643423135,
"grad_norm": 0.848146038346364,
"learning_rate": 2.7511312217194574e-05,
"loss": 0.4776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40771573781967163,
"step": 305,
"valid_targets_mean": 3576.4,
"valid_targets_min": 1520
},
{
"epoch": 0.49128367670364503,
"grad_norm": 0.9694638564949015,
"learning_rate": 2.7963800904977375e-05,
"loss": 0.4906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4891023337841034,
"step": 310,
"valid_targets_mean": 2688.9,
"valid_targets_min": 1303
},
{
"epoch": 0.49920760697305866,
"grad_norm": 1.0834078584446678,
"learning_rate": 2.8416289592760183e-05,
"loss": 0.4946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4841890335083008,
"step": 315,
"valid_targets_mean": 3407.0,
"valid_targets_min": 809
},
{
"epoch": 0.5071315372424723,
"grad_norm": 0.9122194804424244,
"learning_rate": 2.8868778280542988e-05,
"loss": 0.4741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47857069969177246,
"step": 320,
"valid_targets_mean": 2495.8,
"valid_targets_min": 1338
},
{
"epoch": 0.5150554675118859,
"grad_norm": 0.9343811207818954,
"learning_rate": 2.9321266968325792e-05,
"loss": 0.482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4668818712234497,
"step": 325,
"valid_targets_mean": 2979.8,
"valid_targets_min": 1365
},
{
"epoch": 0.5229793977812995,
"grad_norm": 0.9068833355782842,
"learning_rate": 2.97737556561086e-05,
"loss": 0.4667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4718451499938965,
"step": 330,
"valid_targets_mean": 2903.4,
"valid_targets_min": 1354
},
{
"epoch": 0.5309033280507132,
"grad_norm": 0.7990682092269628,
"learning_rate": 3.0226244343891405e-05,
"loss": 0.5061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5103294849395752,
"step": 335,
"valid_targets_mean": 2843.9,
"valid_targets_min": 323
},
{
"epoch": 0.5388272583201268,
"grad_norm": 0.8690173421542774,
"learning_rate": 3.067873303167421e-05,
"loss": 0.4835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5316380262374878,
"step": 340,
"valid_targets_mean": 2980.1,
"valid_targets_min": 926
},
{
"epoch": 0.5467511885895404,
"grad_norm": 0.9164824781790208,
"learning_rate": 3.1131221719457014e-05,
"loss": 0.5017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4985496699810028,
"step": 345,
"valid_targets_mean": 2905.6,
"valid_targets_min": 1131
},
{
"epoch": 0.554675118858954,
"grad_norm": 0.953530103945049,
"learning_rate": 3.158371040723982e-05,
"loss": 0.5038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.506258487701416,
"step": 350,
"valid_targets_mean": 2239.8,
"valid_targets_min": 968
},
{
"epoch": 0.5625990491283677,
"grad_norm": 0.831534497185613,
"learning_rate": 3.203619909502263e-05,
"loss": 0.4813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4679664373397827,
"step": 355,
"valid_targets_mean": 2892.7,
"valid_targets_min": 742
},
{
"epoch": 0.5705229793977813,
"grad_norm": 0.9297214655733225,
"learning_rate": 3.248868778280543e-05,
"loss": 0.4977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5199379920959473,
"step": 360,
"valid_targets_mean": 2508.0,
"valid_targets_min": 944
},
{
"epoch": 0.5784469096671949,
"grad_norm": 0.7980105320092034,
"learning_rate": 3.294117647058824e-05,
"loss": 0.4842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4856064021587372,
"step": 365,
"valid_targets_mean": 3416.5,
"valid_targets_min": 1289
},
{
"epoch": 0.5863708399366085,
"grad_norm": 0.7614084262261346,
"learning_rate": 3.339366515837105e-05,
"loss": 0.4761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4349548816680908,
"step": 370,
"valid_targets_mean": 3276.8,
"valid_targets_min": 994
},
{
"epoch": 0.5942947702060222,
"grad_norm": 0.750217913881111,
"learning_rate": 3.384615384615385e-05,
"loss": 0.4981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5112859606742859,
"step": 375,
"valid_targets_mean": 3364.1,
"valid_targets_min": 949
},
{
"epoch": 0.6022187004754358,
"grad_norm": 0.9079283778370618,
"learning_rate": 3.429864253393665e-05,
"loss": 0.4827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5121220946311951,
"step": 380,
"valid_targets_mean": 2648.1,
"valid_targets_min": 1194
},
{
"epoch": 0.6101426307448494,
"grad_norm": 0.8438307201472272,
"learning_rate": 3.475113122171946e-05,
"loss": 0.474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47371935844421387,
"step": 385,
"valid_targets_mean": 3062.8,
"valid_targets_min": 1584
},
{
"epoch": 0.618066561014263,
"grad_norm": 0.7638788394514087,
"learning_rate": 3.5203619909502266e-05,
"loss": 0.4903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46218085289001465,
"step": 390,
"valid_targets_mean": 3355.6,
"valid_targets_min": 1171
},
{
"epoch": 0.6259904912836767,
"grad_norm": 0.8057208518874918,
"learning_rate": 3.5656108597285074e-05,
"loss": 0.4516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4557874798774719,
"step": 395,
"valid_targets_mean": 2975.8,
"valid_targets_min": 1180
},
{
"epoch": 0.6339144215530903,
"grad_norm": 0.8047504969731512,
"learning_rate": 3.6108597285067875e-05,
"loss": 0.506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5088905096054077,
"step": 400,
"valid_targets_mean": 3338.4,
"valid_targets_min": 1134
},
{
"epoch": 0.6418383518225039,
"grad_norm": 0.7333017715853949,
"learning_rate": 3.656108597285068e-05,
"loss": 0.438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40402841567993164,
"step": 405,
"valid_targets_mean": 3842.2,
"valid_targets_min": 1351
},
{
"epoch": 0.6497622820919176,
"grad_norm": 0.8399572940800708,
"learning_rate": 3.701357466063349e-05,
"loss": 0.5022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48715096712112427,
"step": 410,
"valid_targets_mean": 3547.1,
"valid_targets_min": 1158
},
{
"epoch": 0.6576862123613312,
"grad_norm": 0.6829367274200412,
"learning_rate": 3.746606334841629e-05,
"loss": 0.4701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4927830994129181,
"step": 415,
"valid_targets_mean": 4532.0,
"valid_targets_min": 1815
},
{
"epoch": 0.6656101426307448,
"grad_norm": 0.7331801766359471,
"learning_rate": 3.791855203619909e-05,
"loss": 0.4813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4546471834182739,
"step": 420,
"valid_targets_mean": 3296.0,
"valid_targets_min": 1238
},
{
"epoch": 0.6735340729001584,
"grad_norm": 0.6517565900289717,
"learning_rate": 3.837104072398191e-05,
"loss": 0.4519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3863980174064636,
"step": 425,
"valid_targets_mean": 3856.7,
"valid_targets_min": 1241
},
{
"epoch": 0.6814580031695721,
"grad_norm": 0.7230595741095671,
"learning_rate": 3.882352941176471e-05,
"loss": 0.4603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4377797544002533,
"step": 430,
"valid_targets_mean": 3500.8,
"valid_targets_min": 1413
},
{
"epoch": 0.6893819334389857,
"grad_norm": 0.8116424062683696,
"learning_rate": 3.927601809954751e-05,
"loss": 0.478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48108479380607605,
"step": 435,
"valid_targets_mean": 2934.9,
"valid_targets_min": 1263
},
{
"epoch": 0.6973058637083994,
"grad_norm": 0.7795795329155563,
"learning_rate": 3.972850678733032e-05,
"loss": 0.4656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4403081238269806,
"step": 440,
"valid_targets_mean": 2962.6,
"valid_targets_min": 973
},
{
"epoch": 0.705229793977813,
"grad_norm": 0.7200947601229617,
"learning_rate": 3.99999750146533e-05,
"loss": 0.4536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4119512438774109,
"step": 445,
"valid_targets_mean": 3470.1,
"valid_targets_min": 666
},
{
"epoch": 0.7131537242472267,
"grad_norm": 0.7628047573152018,
"learning_rate": 3.999969393021975e-05,
"loss": 0.4598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4884294271469116,
"step": 450,
"valid_targets_mean": 3419.0,
"valid_targets_min": 933
},
{
"epoch": 0.7210776545166403,
"grad_norm": 0.7380251751146455,
"learning_rate": 3.999910053407327e-05,
"loss": 0.4637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48761463165283203,
"step": 455,
"valid_targets_mean": 4100.1,
"valid_targets_min": 1287
},
{
"epoch": 0.7290015847860539,
"grad_norm": 0.9308179330317129,
"learning_rate": 3.999819483548022e-05,
"loss": 0.4695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4577655792236328,
"step": 460,
"valid_targets_mean": 2391.7,
"valid_targets_min": 1138
},
{
"epoch": 0.7369255150554676,
"grad_norm": 0.7825831726322529,
"learning_rate": 3.999697684858384e-05,
"loss": 0.4776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48154550790786743,
"step": 465,
"valid_targets_mean": 3380.8,
"valid_targets_min": 1034
},
{
"epoch": 0.7448494453248812,
"grad_norm": 0.6672464690362646,
"learning_rate": 3.9995446592403994e-05,
"loss": 0.462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43639689683914185,
"step": 470,
"valid_targets_mean": 3831.9,
"valid_targets_min": 995
},
{
"epoch": 0.7527733755942948,
"grad_norm": 0.8243105277532876,
"learning_rate": 3.9993604090836905e-05,
"loss": 0.4321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47002795338630676,
"step": 475,
"valid_targets_mean": 3040.6,
"valid_targets_min": 917
},
{
"epoch": 0.7606973058637084,
"grad_norm": 0.761930542283936,
"learning_rate": 3.999144937265473e-05,
"loss": 0.4752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46109023690223694,
"step": 480,
"valid_targets_mean": 3145.6,
"valid_targets_min": 1514
},
{
"epoch": 0.768621236133122,
"grad_norm": 0.8060589330068717,
"learning_rate": 3.998898247150519e-05,
"loss": 0.4463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4293675720691681,
"step": 485,
"valid_targets_mean": 2624.5,
"valid_targets_min": 875
},
{
"epoch": 0.7765451664025357,
"grad_norm": 0.7239375292351515,
"learning_rate": 3.9986203425910976e-05,
"loss": 0.4541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49284249544143677,
"step": 490,
"valid_targets_mean": 3257.3,
"valid_targets_min": 1477
},
{
"epoch": 0.7844690966719493,
"grad_norm": 0.661893236239374,
"learning_rate": 3.998311227926918e-05,
"loss": 0.4455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4618075489997864,
"step": 495,
"valid_targets_mean": 3975.6,
"valid_targets_min": 1167
},
{
"epoch": 0.7923930269413629,
"grad_norm": 0.7934924986420486,
"learning_rate": 3.997970907985059e-05,
"loss": 0.5113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5001330375671387,
"step": 500,
"valid_targets_mean": 2784.4,
"valid_targets_min": 1326
},
{
"epoch": 0.8003169572107766,
"grad_norm": 0.8975772569125601,
"learning_rate": 3.9975993880799e-05,
"loss": 0.4497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42663824558258057,
"step": 505,
"valid_targets_mean": 2079.9,
"valid_targets_min": 918
},
{
"epoch": 0.8082408874801902,
"grad_norm": 0.6568781194669023,
"learning_rate": 3.9971966740130284e-05,
"loss": 0.4495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46053969860076904,
"step": 510,
"valid_targets_mean": 3603.1,
"valid_targets_min": 1018
},
{
"epoch": 0.8161648177496038,
"grad_norm": 0.6658645533938224,
"learning_rate": 3.996762772073156e-05,
"loss": 0.4417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4799339771270752,
"step": 515,
"valid_targets_mean": 4443.3,
"valid_targets_min": 1201
},
{
"epoch": 0.8240887480190174,
"grad_norm": 0.8120691967226177,
"learning_rate": 3.996297689036022e-05,
"loss": 0.4691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5048344731330872,
"step": 520,
"valid_targets_mean": 2798.8,
"valid_targets_min": 982
},
{
"epoch": 0.8320126782884311,
"grad_norm": 0.7585539749107885,
"learning_rate": 3.995801432164279e-05,
"loss": 0.4741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42256441712379456,
"step": 525,
"valid_targets_mean": 2953.5,
"valid_targets_min": 1244
},
{
"epoch": 0.8399366085578447,
"grad_norm": 0.7627360477522009,
"learning_rate": 3.9952740092073895e-05,
"loss": 0.4474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45900869369506836,
"step": 530,
"valid_targets_mean": 2668.1,
"valid_targets_min": 1356
},
{
"epoch": 0.8478605388272583,
"grad_norm": 0.7233384200007872,
"learning_rate": 3.9947154284014955e-05,
"loss": 0.472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46540921926498413,
"step": 535,
"valid_targets_mean": 3327.3,
"valid_targets_min": 956
},
{
"epoch": 0.8557844690966719,
"grad_norm": 0.8462825976473535,
"learning_rate": 3.994125698469298e-05,
"loss": 0.4679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44462665915489197,
"step": 540,
"valid_targets_mean": 2309.5,
"valid_targets_min": 839
},
{
"epoch": 0.8637083993660856,
"grad_norm": 0.7523146524714103,
"learning_rate": 3.9935048286199166e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4704914391040802,
"step": 545,
"valid_targets_mean": 3301.1,
"valid_targets_min": 896
},
{
"epoch": 0.8716323296354992,
"grad_norm": 0.7323342838512769,
"learning_rate": 3.992852828548745e-05,
"loss": 0.4391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43246427178382874,
"step": 550,
"valid_targets_mean": 3083.8,
"valid_targets_min": 592
},
{
"epoch": 0.8795562599049128,
"grad_norm": 0.7835802807257946,
"learning_rate": 3.992169708437304e-05,
"loss": 0.4496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42524343729019165,
"step": 555,
"valid_targets_mean": 2537.8,
"valid_targets_min": 805
},
{
"epoch": 0.8874801901743264,
"grad_norm": 0.8164094838303196,
"learning_rate": 3.9914554789530753e-05,
"loss": 0.4494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4827771782875061,
"step": 560,
"valid_targets_mean": 3152.2,
"valid_targets_min": 1026
},
{
"epoch": 0.8954041204437401,
"grad_norm": 0.6690559963612506,
"learning_rate": 3.990710151249342e-05,
"loss": 0.4493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4192623496055603,
"step": 565,
"valid_targets_mean": 3655.5,
"valid_targets_min": 1219
},
{
"epoch": 0.9033280507131537,
"grad_norm": 0.6580359416743707,
"learning_rate": 3.989933736965011e-05,
"loss": 0.4577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4300585389137268,
"step": 570,
"valid_targets_mean": 4057.7,
"valid_targets_min": 762
},
{
"epoch": 0.9112519809825673,
"grad_norm": 0.8064570151818262,
"learning_rate": 3.9891262482244315e-05,
"loss": 0.4571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49867746233940125,
"step": 575,
"valid_targets_mean": 2577.3,
"valid_targets_min": 917
},
{
"epoch": 0.919175911251981,
"grad_norm": 0.7851899897385263,
"learning_rate": 3.988287697637206e-05,
"loss": 0.4444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5172279477119446,
"step": 580,
"valid_targets_mean": 3265.5,
"valid_targets_min": 929
},
{
"epoch": 0.9270998415213946,
"grad_norm": 0.7641647370399206,
"learning_rate": 3.987418098297993e-05,
"loss": 0.423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4322676360607147,
"step": 585,
"valid_targets_mean": 2695.2,
"valid_targets_min": 1420
},
{
"epoch": 0.9350237717908082,
"grad_norm": 0.7323141223552216,
"learning_rate": 3.986517463786304e-05,
"loss": 0.4142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4049820899963379,
"step": 590,
"valid_targets_mean": 2684.9,
"valid_targets_min": 1028
},
{
"epoch": 0.9429477020602218,
"grad_norm": 0.7633256320545897,
"learning_rate": 3.985585808166289e-05,
"loss": 0.4453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4967576563358307,
"step": 595,
"valid_targets_mean": 2754.4,
"valid_targets_min": 1337
},
{
"epoch": 0.9508716323296355,
"grad_norm": 0.7629796008373017,
"learning_rate": 3.9846231459865195e-05,
"loss": 0.4256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43822014331817627,
"step": 600,
"valid_targets_mean": 2671.6,
"valid_targets_min": 1143
},
{
"epoch": 0.9587955625990491,
"grad_norm": 0.8958552133877844,
"learning_rate": 3.983629492279759e-05,
"loss": 0.4518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48023688793182373,
"step": 605,
"valid_targets_mean": 2614.1,
"valid_targets_min": 1174
},
{
"epoch": 0.9667194928684627,
"grad_norm": 0.6996692976043973,
"learning_rate": 3.982604862562729e-05,
"loss": 0.4385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44010189175605774,
"step": 610,
"valid_targets_mean": 3366.1,
"valid_targets_min": 1220
},
{
"epoch": 0.9746434231378764,
"grad_norm": 0.6660341248169072,
"learning_rate": 3.9815492728358674e-05,
"loss": 0.4333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4266677498817444,
"step": 615,
"valid_targets_mean": 3921.9,
"valid_targets_min": 878
},
{
"epoch": 0.9825673534072901,
"grad_norm": 0.9292017152796667,
"learning_rate": 3.980462739583079e-05,
"loss": 0.4216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40375131368637085,
"step": 620,
"valid_targets_mean": 2191.8,
"valid_targets_min": 941
},
{
"epoch": 0.9904912836767037,
"grad_norm": 0.7664309991122322,
"learning_rate": 3.9793452797714765e-05,
"loss": 0.4152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4360402524471283,
"step": 625,
"valid_targets_mean": 3167.6,
"valid_targets_min": 883
},
{
"epoch": 0.9984152139461173,
"grad_norm": 0.762176105418411,
"learning_rate": 3.9781969108511156e-05,
"loss": 0.4323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4275134801864624,
"step": 630,
"valid_targets_mean": 2764.2,
"valid_targets_min": 832
},
{
"epoch": 1.006339144215531,
"grad_norm": 0.704479878187583,
"learning_rate": 3.9770176507547246e-05,
"loss": 0.4287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41019442677497864,
"step": 635,
"valid_targets_mean": 4324.3,
"valid_targets_min": 1450
},
{
"epoch": 1.0142630744849446,
"grad_norm": 0.9019061125405019,
"learning_rate": 3.975807517897422e-05,
"loss": 0.4257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3917194604873657,
"step": 640,
"valid_targets_mean": 2455.1,
"valid_targets_min": 1134
},
{
"epoch": 1.0221870047543582,
"grad_norm": 0.8978043885613115,
"learning_rate": 3.9745665311764305e-05,
"loss": 0.4053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4289025664329529,
"step": 645,
"valid_targets_mean": 2416.1,
"valid_targets_min": 891
},
{
"epoch": 1.0301109350237718,
"grad_norm": 0.7816645884156189,
"learning_rate": 3.973294709970781e-05,
"loss": 0.424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4417671263217926,
"step": 650,
"valid_targets_mean": 2768.1,
"valid_targets_min": 932
},
{
"epoch": 1.0380348652931854,
"grad_norm": 0.718601192352368,
"learning_rate": 3.97199207414101e-05,
"loss": 0.4231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40946125984191895,
"step": 655,
"valid_targets_mean": 3722.6,
"valid_targets_min": 926
},
{
"epoch": 1.045958795562599,
"grad_norm": 0.84427108743179,
"learning_rate": 3.970658644028851e-05,
"loss": 0.4549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46118617057800293,
"step": 660,
"valid_targets_mean": 2638.7,
"valid_targets_min": 832
},
{
"epoch": 1.0538827258320127,
"grad_norm": 0.860139409056787,
"learning_rate": 3.969294440456915e-05,
"loss": 0.4158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43523386120796204,
"step": 665,
"valid_targets_mean": 2739.1,
"valid_targets_min": 1231
},
{
"epoch": 1.0618066561014263,
"grad_norm": 0.7097427943901892,
"learning_rate": 3.9678994847283636e-05,
"loss": 0.4183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3999113142490387,
"step": 670,
"valid_targets_mean": 3927.4,
"valid_targets_min": 1556
},
{
"epoch": 1.06973058637084,
"grad_norm": 0.7042143614988474,
"learning_rate": 3.9664737986265825e-05,
"loss": 0.4003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3503003418445587,
"step": 675,
"valid_targets_mean": 3451.0,
"valid_targets_min": 1132
},
{
"epoch": 1.0776545166402536,
"grad_norm": 0.797726052806819,
"learning_rate": 3.9650174044148364e-05,
"loss": 0.4136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4306812882423401,
"step": 680,
"valid_targets_mean": 2851.7,
"valid_targets_min": 972
},
{
"epoch": 1.0855784469096672,
"grad_norm": 0.7997403365127854,
"learning_rate": 3.9635303248359206e-05,
"loss": 0.4343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4064903259277344,
"step": 685,
"valid_targets_mean": 3858.1,
"valid_targets_min": 828
},
{
"epoch": 1.0935023771790808,
"grad_norm": 0.741920647282534,
"learning_rate": 3.9620125831118105e-05,
"loss": 0.4148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42814987897872925,
"step": 690,
"valid_targets_mean": 3245.4,
"valid_targets_min": 1067
},
{
"epoch": 1.1014263074484945,
"grad_norm": 0.8105775677772558,
"learning_rate": 3.960464202943293e-05,
"loss": 0.4221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42513906955718994,
"step": 695,
"valid_targets_mean": 2785.9,
"valid_targets_min": 1048
},
{
"epoch": 1.109350237717908,
"grad_norm": 0.7115809927579022,
"learning_rate": 3.958885208509601e-05,
"loss": 0.4217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41410183906555176,
"step": 700,
"valid_targets_mean": 3303.6,
"valid_targets_min": 1311
},
{
"epoch": 1.1172741679873217,
"grad_norm": 0.6566885854355542,
"learning_rate": 3.957275624468037e-05,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3849619925022125,
"step": 705,
"valid_targets_mean": 3675.2,
"valid_targets_min": 1298
},
{
"epoch": 1.1251980982567353,
"grad_norm": 0.7159393546972551,
"learning_rate": 3.9556354759535806e-05,
"loss": 0.3989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3957841694355011,
"step": 710,
"valid_targets_mean": 3910.0,
"valid_targets_min": 1085
},
{
"epoch": 1.133122028526149,
"grad_norm": 0.654787326318881,
"learning_rate": 3.9539647885785056e-05,
"loss": 0.4271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42849165201187134,
"step": 715,
"valid_targets_mean": 4003.0,
"valid_targets_min": 1117
},
{
"epoch": 1.1410459587955626,
"grad_norm": 0.692869210178711,
"learning_rate": 3.952263588431971e-05,
"loss": 0.4155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3946205675601959,
"step": 720,
"valid_targets_mean": 3680.2,
"valid_targets_min": 734
},
{
"epoch": 1.1489698890649762,
"grad_norm": 0.8061172018614384,
"learning_rate": 3.950531902079622e-05,
"loss": 0.3988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40015098452568054,
"step": 725,
"valid_targets_mean": 3444.4,
"valid_targets_min": 1252
},
{
"epoch": 1.1568938193343898,
"grad_norm": 0.7318031830672799,
"learning_rate": 3.948769756563167e-05,
"loss": 0.4215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3930429220199585,
"step": 730,
"valid_targets_mean": 3201.9,
"valid_targets_min": 666
},
{
"epoch": 1.1648177496038035,
"grad_norm": 0.612779900383534,
"learning_rate": 3.9469771793999625e-05,
"loss": 0.4347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4050843119621277,
"step": 735,
"valid_targets_mean": 4257.2,
"valid_targets_min": 1484
},
{
"epoch": 1.172741679873217,
"grad_norm": 0.7408822062660686,
"learning_rate": 3.9451541985825786e-05,
"loss": 0.4364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3889385163784027,
"step": 740,
"valid_targets_mean": 3084.0,
"valid_targets_min": 925
},
{
"epoch": 1.1806656101426307,
"grad_norm": 0.8417691654111226,
"learning_rate": 3.9433008425783644e-05,
"loss": 0.4036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39221471548080444,
"step": 745,
"valid_targets_mean": 2542.4,
"valid_targets_min": 824
},
{
"epoch": 1.1885895404120443,
"grad_norm": 0.8455649038780431,
"learning_rate": 3.941417140329002e-05,
"loss": 0.4236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41412001848220825,
"step": 750,
"valid_targets_mean": 2310.1,
"valid_targets_min": 692
},
{
"epoch": 1.196513470681458,
"grad_norm": 0.8023487927804567,
"learning_rate": 3.939503121250055e-05,
"loss": 0.4444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4537830054759979,
"step": 755,
"valid_targets_mean": 2984.4,
"valid_targets_min": 1263
},
{
"epoch": 1.2044374009508716,
"grad_norm": 0.836410102281734,
"learning_rate": 3.937558815230511e-05,
"loss": 0.4309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41315758228302,
"step": 760,
"valid_targets_mean": 2404.2,
"valid_targets_min": 1275
},
{
"epoch": 1.2123613312202852,
"grad_norm": 0.7687019899235902,
"learning_rate": 3.935584252632311e-05,
"loss": 0.3922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4471081495285034,
"step": 765,
"valid_targets_mean": 3286.8,
"valid_targets_min": 881
},
{
"epoch": 1.2202852614896988,
"grad_norm": 0.8076276401226896,
"learning_rate": 3.933579464289877e-05,
"loss": 0.4229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44439810514450073,
"step": 770,
"valid_targets_mean": 2975.2,
"valid_targets_min": 605
},
{
"epoch": 1.2282091917591125,
"grad_norm": 0.6761174721765739,
"learning_rate": 3.931544481509634e-05,
"loss": 0.4123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3570912480354309,
"step": 775,
"valid_targets_mean": 3133.5,
"valid_targets_min": 1202
},
{
"epoch": 1.236133122028526,
"grad_norm": 0.6540995614498064,
"learning_rate": 3.929479336069515e-05,
"loss": 0.4087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4113902449607849,
"step": 780,
"valid_targets_mean": 3971.6,
"valid_targets_min": 1882
},
{
"epoch": 1.2440570522979397,
"grad_norm": 0.7555222122842105,
"learning_rate": 3.9273840602184704e-05,
"loss": 0.4283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.415526807308197,
"step": 785,
"valid_targets_mean": 2650.9,
"valid_targets_min": 1373
},
{
"epoch": 1.2519809825673534,
"grad_norm": 0.7338778533435747,
"learning_rate": 3.925258686675959e-05,
"loss": 0.4202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4193318486213684,
"step": 790,
"valid_targets_mean": 3284.5,
"valid_targets_min": 729
},
{
"epoch": 1.259904912836767,
"grad_norm": 0.6821772996833774,
"learning_rate": 3.9231032486314424e-05,
"loss": 0.424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4240224063396454,
"step": 795,
"valid_targets_mean": 3689.0,
"valid_targets_min": 767
},
{
"epoch": 1.2678288431061806,
"grad_norm": 0.6846368831579128,
"learning_rate": 3.920917779743863e-05,
"loss": 0.4251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3829592764377594,
"step": 800,
"valid_targets_mean": 3325.4,
"valid_targets_min": 1102
},
{
"epoch": 1.2757527733755942,
"grad_norm": 0.6659668031255094,
"learning_rate": 3.9187023141411174e-05,
"loss": 0.4236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38867223262786865,
"step": 805,
"valid_targets_mean": 3416.3,
"valid_targets_min": 1262
},
{
"epoch": 1.2836767036450079,
"grad_norm": 0.7285809624299453,
"learning_rate": 3.916456886419531e-05,
"loss": 0.4231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3913799822330475,
"step": 810,
"valid_targets_mean": 3115.3,
"valid_targets_min": 1613
},
{
"epoch": 1.2916006339144215,
"grad_norm": 0.6294190021912572,
"learning_rate": 3.914181531643308e-05,
"loss": 0.4208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40710440278053284,
"step": 815,
"valid_targets_mean": 4045.3,
"valid_targets_min": 1010
},
{
"epoch": 1.299524564183835,
"grad_norm": 0.6395002952830273,
"learning_rate": 3.9118762853439896e-05,
"loss": 0.4159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38787251710891724,
"step": 820,
"valid_targets_mean": 3804.1,
"valid_targets_min": 1352
},
{
"epoch": 1.3074484944532487,
"grad_norm": 0.8584841420313233,
"learning_rate": 3.909541183519897e-05,
"loss": 0.3973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44322896003723145,
"step": 825,
"valid_targets_mean": 2552.2,
"valid_targets_min": 1167
},
{
"epoch": 1.3153724247226624,
"grad_norm": 0.8556648774974849,
"learning_rate": 3.907176262635573e-05,
"loss": 0.4347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4341663718223572,
"step": 830,
"valid_targets_mean": 2628.5,
"valid_targets_min": 1103
},
{
"epoch": 1.3232963549920762,
"grad_norm": 0.7234909908437245,
"learning_rate": 3.904781559621205e-05,
"loss": 0.3865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39154618978500366,
"step": 835,
"valid_targets_mean": 3121.8,
"valid_targets_min": 1013
},
{
"epoch": 1.3312202852614896,
"grad_norm": 0.8559159891089542,
"learning_rate": 3.9023571118720556e-05,
"loss": 0.4387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.451394259929657,
"step": 840,
"valid_targets_mean": 3243.3,
"valid_targets_min": 1096
},
{
"epoch": 1.3391442155309035,
"grad_norm": 0.6960908027565411,
"learning_rate": 3.899902957247876e-05,
"loss": 0.4319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4584362208843231,
"step": 845,
"valid_targets_mean": 3875.6,
"valid_targets_min": 790
},
{
"epoch": 1.3470681458003169,
"grad_norm": 0.7088383534291515,
"learning_rate": 3.8974191340723156e-05,
"loss": 0.4269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4132707118988037,
"step": 850,
"valid_targets_mean": 3384.2,
"valid_targets_min": 820
},
{
"epoch": 1.3549920760697307,
"grad_norm": 0.9002448432474283,
"learning_rate": 3.89490568113232e-05,
"loss": 0.4319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4581453502178192,
"step": 855,
"valid_targets_mean": 2567.9,
"valid_targets_min": 907
},
{
"epoch": 1.3629160063391441,
"grad_norm": 0.8733397713665929,
"learning_rate": 3.8923626376775304e-05,
"loss": 0.4174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38375404477119446,
"step": 860,
"valid_targets_mean": 2163.6,
"valid_targets_min": 1028
},
{
"epoch": 1.370839936608558,
"grad_norm": 0.7437113903348465,
"learning_rate": 3.889790043419667e-05,
"loss": 0.3846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39502203464508057,
"step": 865,
"valid_targets_mean": 2958.6,
"valid_targets_min": 928
},
{
"epoch": 1.3787638668779714,
"grad_norm": 0.8343548930808327,
"learning_rate": 3.88718793853191e-05,
"loss": 0.3955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3916308283805847,
"step": 870,
"valid_targets_mean": 2949.1,
"valid_targets_min": 1143
},
{
"epoch": 1.3866877971473852,
"grad_norm": 0.7516211189853197,
"learning_rate": 3.884556363648274e-05,
"loss": 0.4079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39778488874435425,
"step": 875,
"valid_targets_mean": 3050.1,
"valid_targets_min": 1425
},
{
"epoch": 1.3946117274167986,
"grad_norm": 1.9122478361363395,
"learning_rate": 3.881895359862971e-05,
"loss": 0.3955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3751554489135742,
"step": 880,
"valid_targets_mean": 3727.2,
"valid_targets_min": 1411
},
{
"epoch": 1.4025356576862125,
"grad_norm": 0.8283328429349839,
"learning_rate": 3.8792049687297676e-05,
"loss": 0.429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4410147964954376,
"step": 885,
"valid_targets_mean": 2555.6,
"valid_targets_min": 1352
},
{
"epoch": 1.4104595879556259,
"grad_norm": 0.7964713017148128,
"learning_rate": 3.8764852322613424e-05,
"loss": 0.3962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4192018508911133,
"step": 890,
"valid_targets_mean": 2898.3,
"valid_targets_min": 1409
},
{
"epoch": 1.4183835182250397,
"grad_norm": 0.9240073279538392,
"learning_rate": 3.873736192928621e-05,
"loss": 0.4215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4372017979621887,
"step": 895,
"valid_targets_mean": 2696.7,
"valid_targets_min": 756
},
{
"epoch": 1.4263074484944531,
"grad_norm": 0.83039785426173,
"learning_rate": 3.870957893660121e-05,
"loss": 0.3843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41866040229797363,
"step": 900,
"valid_targets_mean": 2210.3,
"valid_targets_min": 805
},
{
"epoch": 1.434231378763867,
"grad_norm": 0.80445295919421,
"learning_rate": 3.8681503778412755e-05,
"loss": 0.3896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4015462398529053,
"step": 905,
"valid_targets_mean": 2993.2,
"valid_targets_min": 1028
},
{
"epoch": 1.4421553090332804,
"grad_norm": 0.7688696814096964,
"learning_rate": 3.86531368931376e-05,
"loss": 0.4115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4431518018245697,
"step": 910,
"valid_targets_mean": 2941.3,
"valid_targets_min": 1125
},
{
"epoch": 1.4500792393026942,
"grad_norm": 0.6998329358267783,
"learning_rate": 3.862447872374804e-05,
"loss": 0.4143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3961395025253296,
"step": 915,
"valid_targets_mean": 3132.4,
"valid_targets_min": 1155
},
{
"epoch": 1.4580031695721076,
"grad_norm": 0.7100699865804003,
"learning_rate": 3.859552971776503e-05,
"loss": 0.4,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4128316044807434,
"step": 920,
"valid_targets_mean": 3220.7,
"valid_targets_min": 1136
},
{
"epoch": 1.4659270998415215,
"grad_norm": 0.724096649438488,
"learning_rate": 3.856629032725117e-05,
"loss": 0.4019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.413987398147583,
"step": 925,
"valid_targets_mean": 3048.2,
"valid_targets_min": 1512
},
{
"epoch": 1.473851030110935,
"grad_norm": 0.9087616628326457,
"learning_rate": 3.853676100880366e-05,
"loss": 0.4225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4310683012008667,
"step": 930,
"valid_targets_mean": 2377.6,
"valid_targets_min": 764
},
{
"epoch": 1.4817749603803487,
"grad_norm": 0.696626378789911,
"learning_rate": 3.8506942223547144e-05,
"loss": 0.4151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41933345794677734,
"step": 935,
"valid_targets_mean": 3630.8,
"valid_targets_min": 890
},
{
"epoch": 1.4896988906497624,
"grad_norm": 0.8254765290702623,
"learning_rate": 3.847683443712655e-05,
"loss": 0.4054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4006253480911255,
"step": 940,
"valid_targets_mean": 2531.5,
"valid_targets_min": 613
},
{
"epoch": 1.497622820919176,
"grad_norm": 0.6563699014476309,
"learning_rate": 3.844643811969979e-05,
"loss": 0.3964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3917093873023987,
"step": 945,
"valid_targets_mean": 3745.3,
"valid_targets_min": 1636
},
{
"epoch": 1.5055467511885894,
"grad_norm": 0.7034200261801405,
"learning_rate": 3.8415753745930434e-05,
"loss": 0.3836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37366852164268494,
"step": 950,
"valid_targets_mean": 3708.8,
"valid_targets_min": 1277
},
{
"epoch": 1.5134706814580032,
"grad_norm": 0.7068374328594914,
"learning_rate": 3.8384781794980266e-05,
"loss": 0.3985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3869531750679016,
"step": 955,
"valid_targets_mean": 3328.4,
"valid_targets_min": 1074
},
{
"epoch": 1.5213946117274166,
"grad_norm": 0.7395241815584156,
"learning_rate": 3.835352275050186e-05,
"loss": 0.4003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41180118918418884,
"step": 960,
"valid_targets_mean": 2738.5,
"valid_targets_min": 1475
},
{
"epoch": 1.5293185419968305,
"grad_norm": 0.8711264116280388,
"learning_rate": 3.832197710063095e-05,
"loss": 0.4093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45476359128952026,
"step": 965,
"valid_targets_mean": 2199.7,
"valid_targets_min": 933
},
{
"epoch": 1.537242472266244,
"grad_norm": 0.6703294555536304,
"learning_rate": 3.829014533797889e-05,
"loss": 0.4049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37091028690338135,
"step": 970,
"valid_targets_mean": 3504.9,
"valid_targets_min": 1036
},
{
"epoch": 1.5451664025356577,
"grad_norm": 0.686830221903586,
"learning_rate": 3.8258027959624896e-05,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41083040833473206,
"step": 975,
"valid_targets_mean": 3011.7,
"valid_targets_min": 1312
},
{
"epoch": 1.5530903328050714,
"grad_norm": 0.7408376847260882,
"learning_rate": 3.822562546710831e-05,
"loss": 0.4002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4086455702781677,
"step": 980,
"valid_targets_mean": 2653.7,
"valid_targets_min": 882
},
{
"epoch": 1.561014263074485,
"grad_norm": 0.636239559181727,
"learning_rate": 3.8192938366420783e-05,
"loss": 0.4058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3559831380844116,
"step": 985,
"valid_targets_mean": 3844.6,
"valid_targets_min": 1435
},
{
"epoch": 1.5689381933438986,
"grad_norm": 0.7144101319476477,
"learning_rate": 3.815996716799834e-05,
"loss": 0.4376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4442058801651001,
"step": 990,
"valid_targets_mean": 3304.9,
"valid_targets_min": 1338
},
{
"epoch": 1.5768621236133122,
"grad_norm": 1.1225511402749522,
"learning_rate": 3.812671238671344e-05,
"loss": 0.4297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5221154093742371,
"step": 995,
"valid_targets_mean": 1934.2,
"valid_targets_min": 1198
},
{
"epoch": 1.5847860538827259,
"grad_norm": 0.649928936381306,
"learning_rate": 3.809317454186691e-05,
"loss": 0.3877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3804464042186737,
"step": 1000,
"valid_targets_mean": 3448.9,
"valid_targets_min": 1223
},
{
"epoch": 1.5927099841521395,
"grad_norm": 0.6846783313137514,
"learning_rate": 3.8059354157179856e-05,
"loss": 0.403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37651345133781433,
"step": 1005,
"valid_targets_mean": 3401.1,
"valid_targets_min": 797
},
{
"epoch": 1.6006339144215531,
"grad_norm": 0.7693670022399335,
"learning_rate": 3.802525176078547e-05,
"loss": 0.4051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44831791520118713,
"step": 1010,
"valid_targets_mean": 2622.1,
"valid_targets_min": 965
},
{
"epoch": 1.6085578446909667,
"grad_norm": 0.6930287612571057,
"learning_rate": 3.7990867885220796e-05,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35027647018432617,
"step": 1015,
"valid_targets_mean": 3623.8,
"valid_targets_min": 1302
},
{
"epoch": 1.6164817749603804,
"grad_norm": 0.687012918482246,
"learning_rate": 3.7956203067418404e-05,
"loss": 0.4078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3655385673046112,
"step": 1020,
"valid_targets_mean": 3311.2,
"valid_targets_min": 1444
},
{
"epoch": 1.624405705229794,
"grad_norm": 0.7482238561024599,
"learning_rate": 3.792125784869801e-05,
"loss": 0.3946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4137212634086609,
"step": 1025,
"valid_targets_mean": 3026.4,
"valid_targets_min": 1491
},
{
"epoch": 1.6323296354992076,
"grad_norm": 0.66746545382943,
"learning_rate": 3.788603277475802e-05,
"loss": 0.4134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41697245836257935,
"step": 1030,
"valid_targets_mean": 4302.0,
"valid_targets_min": 1413
},
{
"epoch": 1.6402535657686212,
"grad_norm": 0.753161569313501,
"learning_rate": 3.785052839566701e-05,
"loss": 0.3994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4113873243331909,
"step": 1035,
"valid_targets_mean": 2856.5,
"valid_targets_min": 1125
},
{
"epoch": 1.6481774960380349,
"grad_norm": 0.6546256771695564,
"learning_rate": 3.781474526585515e-05,
"loss": 0.4115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.394817054271698,
"step": 1040,
"valid_targets_mean": 3403.2,
"valid_targets_min": 1422
},
{
"epoch": 1.6561014263074485,
"grad_norm": 0.7277585250229833,
"learning_rate": 3.777868394410549e-05,
"loss": 0.4284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47451382875442505,
"step": 1045,
"valid_targets_mean": 3198.6,
"valid_targets_min": 1517
},
{
"epoch": 1.6640253565768621,
"grad_norm": 0.7015006171574263,
"learning_rate": 3.774234499354534e-05,
"loss": 0.4044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39788326621055603,
"step": 1050,
"valid_targets_mean": 3490.7,
"valid_targets_min": 1153
},
{
"epoch": 1.6719492868462758,
"grad_norm": 0.8474760122796657,
"learning_rate": 3.7705728981637356e-05,
"loss": 0.4203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4005127549171448,
"step": 1055,
"valid_targets_mean": 2430.2,
"valid_targets_min": 1168
},
{
"epoch": 1.6798732171156894,
"grad_norm": 0.7000912329433476,
"learning_rate": 3.7668836480170766e-05,
"loss": 0.3809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37566471099853516,
"step": 1060,
"valid_targets_mean": 3148.2,
"valid_targets_min": 742
},
{
"epoch": 1.687797147385103,
"grad_norm": 0.7518484582066471,
"learning_rate": 3.763166806525241e-05,
"loss": 0.411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4494781494140625,
"step": 1065,
"valid_targets_mean": 2883.8,
"valid_targets_min": 949
},
{
"epoch": 1.6957210776545166,
"grad_norm": 0.7045093699139731,
"learning_rate": 3.759422431729772e-05,
"loss": 0.4124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.360650897026062,
"step": 1070,
"valid_targets_mean": 2946.6,
"valid_targets_min": 1392
},
{
"epoch": 1.7036450079239303,
"grad_norm": 0.7676628810172328,
"learning_rate": 3.7556505821021716e-05,
"loss": 0.4324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4218803942203522,
"step": 1075,
"valid_targets_mean": 2905.9,
"valid_targets_min": 1305
},
{
"epoch": 1.7115689381933439,
"grad_norm": 0.8253811089122368,
"learning_rate": 3.751851316542981e-05,
"loss": 0.4057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3761538863182068,
"step": 1080,
"valid_targets_mean": 3308.4,
"valid_targets_min": 683
},
{
"epoch": 1.7194928684627575,
"grad_norm": 0.6654441883446629,
"learning_rate": 3.748024694380864e-05,
"loss": 0.4001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3409106135368347,
"step": 1085,
"valid_targets_mean": 3397.1,
"valid_targets_min": 980
},
{
"epoch": 1.7274167987321711,
"grad_norm": 0.6484360369162916,
"learning_rate": 3.744170775371683e-05,
"loss": 0.3975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3883214294910431,
"step": 1090,
"valid_targets_mean": 3733.1,
"valid_targets_min": 1168
},
{
"epoch": 1.7353407290015848,
"grad_norm": 0.7031281814385612,
"learning_rate": 3.740289619697561e-05,
"loss": 0.4089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3461092710494995,
"step": 1095,
"valid_targets_mean": 3039.8,
"valid_targets_min": 511
},
{
"epoch": 1.7432646592709984,
"grad_norm": 0.8032936865207325,
"learning_rate": 3.736381287965943e-05,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41207650303840637,
"step": 1100,
"valid_targets_mean": 2640.8,
"valid_targets_min": 1094
},
{
"epoch": 1.751188589540412,
"grad_norm": 0.7024977935027796,
"learning_rate": 3.7324458412086547e-05,
"loss": 0.3996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4368237853050232,
"step": 1105,
"valid_targets_mean": 3143.6,
"valid_targets_min": 1047
},
{
"epoch": 1.7591125198098256,
"grad_norm": 0.7123522087918879,
"learning_rate": 3.728483340880939e-05,
"loss": 0.3909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42601120471954346,
"step": 1110,
"valid_targets_mean": 3299.2,
"valid_targets_min": 1364
},
{
"epoch": 1.7670364500792393,
"grad_norm": 0.7419859314602727,
"learning_rate": 3.7244938488605084e-05,
"loss": 0.3934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37845379114151,
"step": 1115,
"valid_targets_mean": 3138.9,
"valid_targets_min": 956
},
{
"epoch": 1.7749603803486529,
"grad_norm": 0.8181546771338208,
"learning_rate": 3.7204774274465694e-05,
"loss": 0.382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43097904324531555,
"step": 1120,
"valid_targets_mean": 2586.9,
"valid_targets_min": 1087
},
{
"epoch": 1.7828843106180665,
"grad_norm": 0.6818665315017823,
"learning_rate": 3.716434139358855e-05,
"loss": 0.4197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40882283449172974,
"step": 1125,
"valid_targets_mean": 3429.4,
"valid_targets_min": 1192
},
{
"epoch": 1.7908082408874801,
"grad_norm": 0.8821106883318396,
"learning_rate": 3.712364047736643e-05,
"loss": 0.4063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38789087533950806,
"step": 1130,
"valid_targets_mean": 2882.9,
"valid_targets_min": 1102
},
{
"epoch": 1.7987321711568938,
"grad_norm": 0.6396888823145678,
"learning_rate": 3.7082672161377706e-05,
"loss": 0.4018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.375009685754776,
"step": 1135,
"valid_targets_mean": 3623.6,
"valid_targets_min": 1434
},
{
"epoch": 1.8066561014263076,
"grad_norm": 0.6985921775082531,
"learning_rate": 3.70414370853764e-05,
"loss": 0.3961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4500548243522644,
"step": 1140,
"valid_targets_mean": 3521.9,
"valid_targets_min": 1123
},
{
"epoch": 1.814580031695721,
"grad_norm": 0.6528447006130813,
"learning_rate": 3.6999935893282254e-05,
"loss": 0.3882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3747301697731018,
"step": 1145,
"valid_targets_mean": 3697.4,
"valid_targets_min": 1239
},
{
"epoch": 1.8225039619651349,
"grad_norm": 0.777122366373374,
"learning_rate": 3.695816923317058e-05,
"loss": 0.4189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3883894085884094,
"step": 1150,
"valid_targets_mean": 2929.1,
"valid_targets_min": 1149
},
{
"epoch": 1.8304278922345483,
"grad_norm": 0.7469966383617292,
"learning_rate": 3.691613775726223e-05,
"loss": 0.3863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4305916726589203,
"step": 1155,
"valid_targets_mean": 2614.3,
"valid_targets_min": 1168
},
{
"epoch": 1.8383518225039621,
"grad_norm": 0.6111573888862004,
"learning_rate": 3.687384212191336e-05,
"loss": 0.3952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3437587022781372,
"step": 1160,
"valid_targets_mean": 4098.4,
"valid_targets_min": 926
},
{
"epoch": 1.8462757527733755,
"grad_norm": 0.7266326774607562,
"learning_rate": 3.6831282987605185e-05,
"loss": 0.4203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39362356066703796,
"step": 1165,
"valid_targets_mean": 2666.9,
"valid_targets_min": 772
},
{
"epoch": 1.8541996830427894,
"grad_norm": 0.8846404507919211,
"learning_rate": 3.6788461018933695e-05,
"loss": 0.3953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37495893239974976,
"step": 1170,
"valid_targets_mean": 3182.8,
"valid_targets_min": 1724
},
{
"epoch": 1.8621236133122028,
"grad_norm": 0.7579090022128943,
"learning_rate": 3.674537688459924e-05,
"loss": 0.3982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41980457305908203,
"step": 1175,
"valid_targets_mean": 2550.7,
"valid_targets_min": 1142
},
{
"epoch": 1.8700475435816166,
"grad_norm": 0.8055268692496189,
"learning_rate": 3.67020312573961e-05,
"loss": 0.4301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4746722877025604,
"step": 1180,
"valid_targets_mean": 2543.4,
"valid_targets_min": 1425
},
{
"epoch": 1.87797147385103,
"grad_norm": 0.7072175582291216,
"learning_rate": 3.665842481420199e-05,
"loss": 0.4094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4191814064979553,
"step": 1185,
"valid_targets_mean": 3546.8,
"valid_targets_min": 1471
},
{
"epoch": 1.8858954041204439,
"grad_norm": 0.755666919283838,
"learning_rate": 3.661455823596749e-05,
"loss": 0.4235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41528838872909546,
"step": 1190,
"valid_targets_mean": 2681.6,
"valid_targets_min": 868
},
{
"epoch": 1.8938193343898573,
"grad_norm": 0.6908769369919235,
"learning_rate": 3.6570432207705366e-05,
"loss": 0.3828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39453238248825073,
"step": 1195,
"valid_targets_mean": 3171.2,
"valid_targets_min": 807
},
{
"epoch": 1.9017432646592711,
"grad_norm": 0.6611245364364247,
"learning_rate": 3.652604741847996e-05,
"loss": 0.3746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3662848472595215,
"step": 1200,
"valid_targets_mean": 3316.7,
"valid_targets_min": 1167
},
{
"epoch": 1.9096671949286845,
"grad_norm": 0.5929280738291254,
"learning_rate": 3.648140456139635e-05,
"loss": 0.3828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3568131625652313,
"step": 1205,
"valid_targets_mean": 3974.2,
"valid_targets_min": 1544
},
{
"epoch": 1.9175911251980984,
"grad_norm": 0.6945487108386357,
"learning_rate": 3.643650433358956e-05,
"loss": 0.3976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.376843124628067,
"step": 1210,
"valid_targets_mean": 2674.7,
"valid_targets_min": 1367
},
{
"epoch": 1.9255150554675118,
"grad_norm": 0.6712784164628189,
"learning_rate": 3.639134743621368e-05,
"loss": 0.4015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41648247838020325,
"step": 1215,
"valid_targets_mean": 3261.2,
"valid_targets_min": 1073
},
{
"epoch": 1.9334389857369256,
"grad_norm": 0.656538586479345,
"learning_rate": 3.63459345744309e-05,
"loss": 0.3785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3585965633392334,
"step": 1220,
"valid_targets_mean": 3355.2,
"valid_targets_min": 1300
},
{
"epoch": 1.941362916006339,
"grad_norm": 0.6904029377773084,
"learning_rate": 3.630026645740049e-05,
"loss": 0.4263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4165318012237549,
"step": 1225,
"valid_targets_mean": 2927.4,
"valid_targets_min": 1580
},
{
"epoch": 1.9492868462757529,
"grad_norm": 0.6679269706627182,
"learning_rate": 3.625434379826777e-05,
"loss": 0.4054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42261233925819397,
"step": 1230,
"valid_targets_mean": 3125.9,
"valid_targets_min": 1152
},
{
"epoch": 1.9572107765451663,
"grad_norm": 0.7041857593125621,
"learning_rate": 3.620816731415293e-05,
"loss": 0.4009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4373818039894104,
"step": 1235,
"valid_targets_mean": 3272.8,
"valid_targets_min": 852
},
{
"epoch": 1.9651347068145801,
"grad_norm": 0.7101332039778864,
"learning_rate": 3.616173772613985e-05,
"loss": 0.392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35600316524505615,
"step": 1240,
"valid_targets_mean": 2676.8,
"valid_targets_min": 1040
},
{
"epoch": 1.9730586370839935,
"grad_norm": 0.6634520936002515,
"learning_rate": 3.611505575926482e-05,
"loss": 0.4069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39966195821762085,
"step": 1245,
"valid_targets_mean": 3331.6,
"valid_targets_min": 951
},
{
"epoch": 1.9809825673534074,
"grad_norm": 0.6785145786730344,
"learning_rate": 3.6068122142505265e-05,
"loss": 0.3868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38170456886291504,
"step": 1250,
"valid_targets_mean": 2993.2,
"valid_targets_min": 1445
},
{
"epoch": 1.9889064976228208,
"grad_norm": 0.6316749595759299,
"learning_rate": 3.602093760876831e-05,
"loss": 0.3925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41541820764541626,
"step": 1255,
"valid_targets_mean": 4683.4,
"valid_targets_min": 1904
},
{
"epoch": 1.9968304278922346,
"grad_norm": 0.6421496174511931,
"learning_rate": 3.597350289487935e-05,
"loss": 0.3847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3562106490135193,
"step": 1260,
"valid_targets_mean": 3179.0,
"valid_targets_min": 804
},
{
"epoch": 2.004754358161648,
"grad_norm": 0.6676059687606999,
"learning_rate": 3.5925818741570566e-05,
"loss": 0.3712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2841273546218872,
"step": 1265,
"valid_targets_mean": 3497.7,
"valid_targets_min": 1563
},
{
"epoch": 2.012678288431062,
"grad_norm": 0.7062366601502383,
"learning_rate": 3.587788589346932e-05,
"loss": 0.3875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3702091574668884,
"step": 1270,
"valid_targets_mean": 3476.4,
"valid_targets_min": 904
},
{
"epoch": 2.0206022187004753,
"grad_norm": 0.7515066065460074,
"learning_rate": 3.5829705099086586e-05,
"loss": 0.355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3285125494003296,
"step": 1275,
"valid_targets_mean": 3045.9,
"valid_targets_min": 967
},
{
"epoch": 2.028526148969889,
"grad_norm": 0.6511406045365554,
"learning_rate": 3.578127711080517e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32423993945121765,
"step": 1280,
"valid_targets_mean": 3313.9,
"valid_targets_min": 1218
},
{
"epoch": 2.0364500792393025,
"grad_norm": 0.6629925563372985,
"learning_rate": 3.5732602684868065e-05,
"loss": 0.3337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35224616527557373,
"step": 1285,
"valid_targets_mean": 3352.9,
"valid_targets_min": 945
},
{
"epoch": 2.0443740095087164,
"grad_norm": 0.6852450135475233,
"learning_rate": 3.568368258136657e-05,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35313695669174194,
"step": 1290,
"valid_targets_mean": 3369.9,
"valid_targets_min": 778
},
{
"epoch": 2.05229793977813,
"grad_norm": 0.6804763117304029,
"learning_rate": 3.563451756422843e-05,
"loss": 0.3536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3494824171066284,
"step": 1295,
"valid_targets_mean": 3336.2,
"valid_targets_min": 1403
},
{
"epoch": 2.0602218700475436,
"grad_norm": 0.7451628554485628,
"learning_rate": 3.558510840120594e-05,
"loss": 0.3825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4016644358634949,
"step": 1300,
"valid_targets_mean": 3308.9,
"valid_targets_min": 1237
},
{
"epoch": 2.068145800316957,
"grad_norm": 0.7479732131470967,
"learning_rate": 3.553545586386392e-05,
"loss": 0.3744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3414376974105835,
"step": 1305,
"valid_targets_mean": 3150.8,
"valid_targets_min": 929
},
{
"epoch": 2.076069730586371,
"grad_norm": 0.6039441228458018,
"learning_rate": 3.5485560727567686e-05,
"loss": 0.365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3465012311935425,
"step": 1310,
"valid_targets_mean": 3960.5,
"valid_targets_min": 1781
},
{
"epoch": 2.0839936608557843,
"grad_norm": 0.7773497361755427,
"learning_rate": 3.543542377147093e-05,
"loss": 0.3727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37093955278396606,
"step": 1315,
"valid_targets_mean": 2705.9,
"valid_targets_min": 1477
},
{
"epoch": 2.091917591125198,
"grad_norm": 0.7862507036909796,
"learning_rate": 3.5385045778503574e-05,
"loss": 0.3685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4063432216644287,
"step": 1320,
"valid_targets_mean": 2707.6,
"valid_targets_min": 1327
},
{
"epoch": 2.0998415213946116,
"grad_norm": 0.9375539482705244,
"learning_rate": 3.533442753535952e-05,
"loss": 0.3756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35002627968788147,
"step": 1325,
"valid_targets_mean": 3312.0,
"valid_targets_min": 1131
},
{
"epoch": 2.1077654516640254,
"grad_norm": 0.7318154628229018,
"learning_rate": 3.528356983248438e-05,
"loss": 0.3599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35978320240974426,
"step": 1330,
"valid_targets_mean": 2899.5,
"valid_targets_min": 1433
},
{
"epoch": 2.115689381933439,
"grad_norm": 0.696363310675273,
"learning_rate": 3.523247346406311e-05,
"loss": 0.3605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32494083046913147,
"step": 1335,
"valid_targets_mean": 3550.9,
"valid_targets_min": 1021
},
{
"epoch": 2.1236133122028527,
"grad_norm": 0.8237973354896262,
"learning_rate": 3.518113922800765e-05,
"loss": 0.3506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35818031430244446,
"step": 1340,
"valid_targets_mean": 3031.8,
"valid_targets_min": 673
},
{
"epoch": 2.131537242472266,
"grad_norm": 0.66311971156985,
"learning_rate": 3.512956792594442e-05,
"loss": 0.3584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36689960956573486,
"step": 1345,
"valid_targets_mean": 3550.8,
"valid_targets_min": 950
},
{
"epoch": 2.13946117274168,
"grad_norm": 0.8721689360378009,
"learning_rate": 3.5077760363201835e-05,
"loss": 0.3464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.385911762714386,
"step": 1350,
"valid_targets_mean": 2141.8,
"valid_targets_min": 953
},
{
"epoch": 2.1473851030110933,
"grad_norm": 0.6726564862719653,
"learning_rate": 3.50257173487977e-05,
"loss": 0.3566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3518974184989929,
"step": 1355,
"valid_targets_mean": 3165.7,
"valid_targets_min": 1298
},
{
"epoch": 2.155309033280507,
"grad_norm": 0.8591285613969092,
"learning_rate": 3.4973439695426606e-05,
"loss": 0.366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4314518868923187,
"step": 1360,
"valid_targets_mean": 2363.4,
"valid_targets_min": 1010
},
{
"epoch": 2.1632329635499206,
"grad_norm": 0.6640118779055022,
"learning_rate": 3.492092821944722e-05,
"loss": 0.3556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3326745629310608,
"step": 1365,
"valid_targets_mean": 3621.4,
"valid_targets_min": 1238
},
{
"epoch": 2.1711568938193344,
"grad_norm": 0.7418113772849524,
"learning_rate": 3.4868183740869544e-05,
"loss": 0.3692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3442697525024414,
"step": 1370,
"valid_targets_mean": 2723.8,
"valid_targets_min": 1171
},
{
"epoch": 2.179080824088748,
"grad_norm": 0.7504301461052274,
"learning_rate": 3.48152070833421e-05,
"loss": 0.3793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36825960874557495,
"step": 1375,
"valid_targets_mean": 2962.6,
"valid_targets_min": 1328
},
{
"epoch": 2.1870047543581617,
"grad_norm": 0.8957004442452282,
"learning_rate": 3.476199907413909e-05,
"loss": 0.3878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.412288099527359,
"step": 1380,
"valid_targets_mean": 2568.7,
"valid_targets_min": 1206
},
{
"epoch": 2.194928684627575,
"grad_norm": 0.7694928144436127,
"learning_rate": 3.4708560544147435e-05,
"loss": 0.3805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4149361252784729,
"step": 1385,
"valid_targets_mean": 2675.1,
"valid_targets_min": 1219
},
{
"epoch": 2.202852614896989,
"grad_norm": 0.7389166507314462,
"learning_rate": 3.465489232785388e-05,
"loss": 0.3659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32906919717788696,
"step": 1390,
"valid_targets_mean": 2730.8,
"valid_targets_min": 1188
},
{
"epoch": 2.2107765451664028,
"grad_norm": 0.79731266620094,
"learning_rate": 3.460099526333184e-05,
"loss": 0.3801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34242305159568787,
"step": 1395,
"valid_targets_mean": 2235.1,
"valid_targets_min": 982
},
{
"epoch": 2.218700475435816,
"grad_norm": 0.7176220862553758,
"learning_rate": 3.4546870192228446e-05,
"loss": 0.3528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36401069164276123,
"step": 1400,
"valid_targets_mean": 3310.4,
"valid_targets_min": 1168
},
{
"epoch": 2.2266244057052296,
"grad_norm": 0.6300501071926575,
"learning_rate": 3.449251795975132e-05,
"loss": 0.4117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3608476519584656,
"step": 1405,
"valid_targets_mean": 3842.1,
"valid_targets_min": 1080
},
{
"epoch": 2.2345483359746434,
"grad_norm": 0.6586933639077392,
"learning_rate": 3.4437939414655375e-05,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29544296860694885,
"step": 1410,
"valid_targets_mean": 2897.9,
"valid_targets_min": 992
},
{
"epoch": 2.2424722662440573,
"grad_norm": 0.747007744021972,
"learning_rate": 3.438313540922961e-05,
"loss": 0.3768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.378732293844223,
"step": 1415,
"valid_targets_mean": 2782.6,
"valid_targets_min": 1405
},
{
"epoch": 2.2503961965134707,
"grad_norm": 0.8127811072244645,
"learning_rate": 3.432810679928376e-05,
"loss": 0.3929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4382305145263672,
"step": 1420,
"valid_targets_mean": 2800.4,
"valid_targets_min": 1318
},
{
"epoch": 2.258320126782884,
"grad_norm": 0.7157439338354276,
"learning_rate": 3.427285444413495e-05,
"loss": 0.3528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3332955241203308,
"step": 1425,
"valid_targets_mean": 3116.9,
"valid_targets_min": 1673
},
{
"epoch": 2.266244057052298,
"grad_norm": 0.6962204553743823,
"learning_rate": 3.421737920659427e-05,
"loss": 0.349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32148024439811707,
"step": 1430,
"valid_targets_mean": 2878.9,
"valid_targets_min": 871
},
{
"epoch": 2.2741679873217118,
"grad_norm": 0.713354512987655,
"learning_rate": 3.416168195295329e-05,
"loss": 0.3591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3718951940536499,
"step": 1435,
"valid_targets_mean": 3088.2,
"valid_targets_min": 1342
},
{
"epoch": 2.282091917591125,
"grad_norm": 0.7008120501571135,
"learning_rate": 3.410576355297056e-05,
"loss": 0.3556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33514919877052307,
"step": 1440,
"valid_targets_mean": 2861.1,
"valid_targets_min": 1199
},
{
"epoch": 2.2900158478605386,
"grad_norm": 0.806299441185959,
"learning_rate": 3.404962487985801e-05,
"loss": 0.3668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3846312463283539,
"step": 1445,
"valid_targets_mean": 2405.8,
"valid_targets_min": 831
},
{
"epoch": 2.2979397781299524,
"grad_norm": 0.761461112866616,
"learning_rate": 3.399326681026731e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38813963532447815,
"step": 1450,
"valid_targets_mean": 2826.6,
"valid_targets_min": 1430
},
{
"epoch": 2.3058637083993663,
"grad_norm": 0.9191487962494499,
"learning_rate": 3.3936690224276194e-05,
"loss": 0.3761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4349742531776428,
"step": 1455,
"valid_targets_mean": 2471.1,
"valid_targets_min": 809
},
{
"epoch": 2.3137876386687797,
"grad_norm": 0.6867460029163497,
"learning_rate": 3.3879896005374705e-05,
"loss": 0.3772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3719336986541748,
"step": 1460,
"valid_targets_mean": 3600.1,
"valid_targets_min": 640
},
{
"epoch": 2.3217115689381935,
"grad_norm": 0.7140439142369251,
"learning_rate": 3.382288504045141e-05,
"loss": 0.355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3862805962562561,
"step": 1465,
"valid_targets_mean": 3404.2,
"valid_targets_min": 434
},
{
"epoch": 2.329635499207607,
"grad_norm": 0.845295556326319,
"learning_rate": 3.3765658219779537e-05,
"loss": 0.3683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39049577713012695,
"step": 1470,
"valid_targets_mean": 2238.2,
"valid_targets_min": 767
},
{
"epoch": 2.337559429477021,
"grad_norm": 0.6210399121619489,
"learning_rate": 3.370821643700307e-05,
"loss": 0.3559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34238991141319275,
"step": 1475,
"valid_targets_mean": 3526.3,
"valid_targets_min": 1052
},
{
"epoch": 2.345483359746434,
"grad_norm": 0.670480766135351,
"learning_rate": 3.365056058912282e-05,
"loss": 0.383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33082759380340576,
"step": 1480,
"valid_targets_mean": 3321.8,
"valid_targets_min": 1409
},
{
"epoch": 2.353407290015848,
"grad_norm": 0.6766348332163563,
"learning_rate": 3.3592691576482414e-05,
"loss": 0.3559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3270394206047058,
"step": 1485,
"valid_targets_mean": 3748.6,
"valid_targets_min": 1485
},
{
"epoch": 2.3613312202852614,
"grad_norm": 0.7949053191718662,
"learning_rate": 3.353461030275418e-05,
"loss": 0.3774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3639070391654968,
"step": 1490,
"valid_targets_mean": 3388.0,
"valid_targets_min": 623
},
{
"epoch": 2.3692551505546753,
"grad_norm": 0.7129315145411875,
"learning_rate": 3.3476317674925126e-05,
"loss": 0.3551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3307371735572815,
"step": 1495,
"valid_targets_mean": 3125.2,
"valid_targets_min": 1123
},
{
"epoch": 2.3771790808240887,
"grad_norm": 0.7319999465255304,
"learning_rate": 3.341781460328267e-05,
"loss": 0.3705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3839896619319916,
"step": 1500,
"valid_targets_mean": 2962.8,
"valid_targets_min": 1040
},
{
"epoch": 2.3851030110935025,
"grad_norm": 0.7492489121406776,
"learning_rate": 3.3359102001400555e-05,
"loss": 0.3741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3603183627128601,
"step": 1505,
"valid_targets_mean": 2949.4,
"valid_targets_min": 605
},
{
"epoch": 2.393026941362916,
"grad_norm": 0.7950258446330948,
"learning_rate": 3.330018078612446e-05,
"loss": 0.3737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37683820724487305,
"step": 1510,
"valid_targets_mean": 2834.4,
"valid_targets_min": 916
},
{
"epoch": 2.40095087163233,
"grad_norm": 0.8185064986671969,
"learning_rate": 3.324105187755775e-05,
"loss": 0.3676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38336193561553955,
"step": 1515,
"valid_targets_mean": 2173.2,
"valid_targets_min": 1103
},
{
"epoch": 2.408874801901743,
"grad_norm": 0.6460844220432804,
"learning_rate": 3.318171619904709e-05,
"loss": 0.3755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34656602144241333,
"step": 1520,
"valid_targets_mean": 3330.8,
"valid_targets_min": 1132
},
{
"epoch": 2.416798732171157,
"grad_norm": 0.6942145163373754,
"learning_rate": 3.3122174677168027e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.392851322889328,
"step": 1525,
"valid_targets_mean": 3246.0,
"valid_targets_min": 305
},
{
"epoch": 2.4247226624405704,
"grad_norm": 0.6507292400611256,
"learning_rate": 3.306242824171053e-05,
"loss": 0.3824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38254374265670776,
"step": 1530,
"valid_targets_mean": 3621.5,
"valid_targets_min": 1123
},
{
"epoch": 2.4326465927099843,
"grad_norm": 0.7278179160659652,
"learning_rate": 3.300247782566445e-05,
"loss": 0.3678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3891586661338806,
"step": 1535,
"valid_targets_mean": 3476.8,
"valid_targets_min": 1357
},
{
"epoch": 2.4405705229793977,
"grad_norm": 0.6983942948833125,
"learning_rate": 3.294232436520499e-05,
"loss": 0.3463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33123183250427246,
"step": 1540,
"valid_targets_mean": 3465.1,
"valid_targets_min": 1288
},
{
"epoch": 2.4484944532488115,
"grad_norm": 0.6594224791344621,
"learning_rate": 3.288196879967801e-05,
"loss": 0.3684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38076046109199524,
"step": 1545,
"valid_targets_mean": 3734.8,
"valid_targets_min": 1161
},
{
"epoch": 2.456418383518225,
"grad_norm": 0.7471632828891966,
"learning_rate": 3.282141207158546e-05,
"loss": 0.3683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3740571141242981,
"step": 1550,
"valid_targets_mean": 3052.6,
"valid_targets_min": 1220
},
{
"epoch": 2.464342313787639,
"grad_norm": 0.7075053052011875,
"learning_rate": 3.276065512657058e-05,
"loss": 0.3705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3714832663536072,
"step": 1555,
"valid_targets_mean": 3095.8,
"valid_targets_min": 1603
},
{
"epoch": 2.472266244057052,
"grad_norm": 0.7245176872705255,
"learning_rate": 3.269969891340315e-05,
"loss": 0.3577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3616369664669037,
"step": 1560,
"valid_targets_mean": 3465.4,
"valid_targets_min": 911
},
{
"epoch": 2.480190174326466,
"grad_norm": 0.707650235922073,
"learning_rate": 3.263854438396473e-05,
"loss": 0.3522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3539058268070221,
"step": 1565,
"valid_targets_mean": 3309.2,
"valid_targets_min": 1521
},
{
"epoch": 2.4881141045958794,
"grad_norm": 0.7349689198868826,
"learning_rate": 3.257719249323371e-05,
"loss": 0.3602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37612348794937134,
"step": 1570,
"valid_targets_mean": 2882.0,
"valid_targets_min": 1184
},
{
"epoch": 2.4960380348652933,
"grad_norm": 0.9170986597030537,
"learning_rate": 3.251564419927046e-05,
"loss": 0.3602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39871150255203247,
"step": 1575,
"valid_targets_mean": 2766.1,
"valid_targets_min": 1338
},
{
"epoch": 2.5039619651347067,
"grad_norm": 0.6961153396437054,
"learning_rate": 3.245390046320234e-05,
"loss": 0.3558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3306850492954254,
"step": 1580,
"valid_targets_mean": 3363.3,
"valid_targets_min": 1641
},
{
"epoch": 2.5118858954041206,
"grad_norm": 0.695789931766822,
"learning_rate": 3.239196224920873e-05,
"loss": 0.3481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37488996982574463,
"step": 1585,
"valid_targets_mean": 3035.2,
"valid_targets_min": 969
},
{
"epoch": 2.519809825673534,
"grad_norm": 0.7571853645906732,
"learning_rate": 3.232983052450588e-05,
"loss": 0.3649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3629456162452698,
"step": 1590,
"valid_targets_mean": 2581.4,
"valid_targets_min": 1175
},
{
"epoch": 2.527733755942948,
"grad_norm": 0.7703230366613334,
"learning_rate": 3.2267506259331936e-05,
"loss": 0.398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4350147843360901,
"step": 1595,
"valid_targets_mean": 2874.7,
"valid_targets_min": 1122
},
{
"epoch": 2.535657686212361,
"grad_norm": 0.6346611462613172,
"learning_rate": 3.220499042693167e-05,
"loss": 0.3724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34332937002182007,
"step": 1600,
"valid_targets_mean": 3585.5,
"valid_targets_min": 1364
},
{
"epoch": 2.543581616481775,
"grad_norm": 0.8006448514494869,
"learning_rate": 3.214228400354137e-05,
"loss": 0.3751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40395885705947876,
"step": 1605,
"valid_targets_mean": 3247.1,
"valid_targets_min": 1270
},
{
"epoch": 2.5515055467511885,
"grad_norm": 0.7559604723688351,
"learning_rate": 3.207938796837354e-05,
"loss": 0.3904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37246257066726685,
"step": 1610,
"valid_targets_mean": 2641.6,
"valid_targets_min": 1071
},
{
"epoch": 2.5594294770206023,
"grad_norm": 0.7353157217889033,
"learning_rate": 3.201630330360165e-05,
"loss": 0.3588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3442043662071228,
"step": 1615,
"valid_targets_mean": 2777.2,
"valid_targets_min": 1471
},
{
"epoch": 2.5673534072900157,
"grad_norm": 0.720107392698628,
"learning_rate": 3.195303099434474e-05,
"loss": 0.3699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41481178998947144,
"step": 1620,
"valid_targets_mean": 3245.4,
"valid_targets_min": 954
},
{
"epoch": 2.5752773375594296,
"grad_norm": 0.776231256992938,
"learning_rate": 3.1889572028652106e-05,
"loss": 0.368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36978304386138916,
"step": 1625,
"valid_targets_mean": 2458.1,
"valid_targets_min": 1103
},
{
"epoch": 2.583201267828843,
"grad_norm": 0.6657358034169792,
"learning_rate": 3.182592739748783e-05,
"loss": 0.3534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37111061811447144,
"step": 1630,
"valid_targets_mean": 3370.6,
"valid_targets_min": 1365
},
{
"epoch": 2.591125198098257,
"grad_norm": 0.6712733739184077,
"learning_rate": 3.17620980947153e-05,
"loss": 0.3615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34165388345718384,
"step": 1635,
"valid_targets_mean": 3146.2,
"valid_targets_min": 1259
},
{
"epoch": 2.59904912836767,
"grad_norm": 0.8228340893308538,
"learning_rate": 3.1698085117081725e-05,
"loss": 0.3741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4077662229537964,
"step": 1640,
"valid_targets_mean": 2459.1,
"valid_targets_min": 719
},
{
"epoch": 2.606973058637084,
"grad_norm": 0.7144944121446368,
"learning_rate": 3.163388946420253e-05,
"loss": 0.3697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37951573729515076,
"step": 1645,
"valid_targets_mean": 2752.9,
"valid_targets_min": 1282
},
{
"epoch": 2.6148969889064975,
"grad_norm": 0.8614676246761742,
"learning_rate": 3.156951213854578e-05,
"loss": 0.3758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3518531024456024,
"step": 1650,
"valid_targets_mean": 3622.9,
"valid_targets_min": 1274
},
{
"epoch": 2.6228209191759113,
"grad_norm": 0.6797007118760665,
"learning_rate": 3.1504954145416494e-05,
"loss": 0.3624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.354215145111084,
"step": 1655,
"valid_targets_mean": 3218.9,
"valid_targets_min": 1131
},
{
"epoch": 2.6307448494453247,
"grad_norm": 0.6901202480893878,
"learning_rate": 3.144021649294096e-05,
"loss": 0.3741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36378616094589233,
"step": 1660,
"valid_targets_mean": 3135.1,
"valid_targets_min": 1197
},
{
"epoch": 2.6386687797147386,
"grad_norm": 0.72642791007056,
"learning_rate": 3.137530019205104e-05,
"loss": 0.3402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3361148238182068,
"step": 1665,
"valid_targets_mean": 3140.4,
"valid_targets_min": 1078
},
{
"epoch": 2.6465927099841524,
"grad_norm": 0.736512606598198,
"learning_rate": 3.131020625646827e-05,
"loss": 0.3533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36432206630706787,
"step": 1670,
"valid_targets_mean": 2840.2,
"valid_targets_min": 1376
},
{
"epoch": 2.654516640253566,
"grad_norm": 0.7161092212114627,
"learning_rate": 3.124493570268815e-05,
"loss": 0.3697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.384030282497406,
"step": 1675,
"valid_targets_mean": 3557.6,
"valid_targets_min": 1364
},
{
"epoch": 2.662440570522979,
"grad_norm": 0.6866773135599233,
"learning_rate": 3.117948954996419e-05,
"loss": 0.3485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3353482186794281,
"step": 1680,
"valid_targets_mean": 3323.8,
"valid_targets_min": 1241
},
{
"epoch": 2.670364500792393,
"grad_norm": 0.7214323381715583,
"learning_rate": 3.111386882029205e-05,
"loss": 0.3557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3556535243988037,
"step": 1685,
"valid_targets_mean": 2939.8,
"valid_targets_min": 465
},
{
"epoch": 2.678288431061807,
"grad_norm": 0.7532775358119311,
"learning_rate": 3.1048074538393515e-05,
"loss": 0.3705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3484819531440735,
"step": 1690,
"valid_targets_mean": 2753.2,
"valid_targets_min": 926
},
{
"epoch": 2.6862123613312203,
"grad_norm": 0.7196890582839597,
"learning_rate": 3.098210773170057e-05,
"loss": 0.3674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39478743076324463,
"step": 1695,
"valid_targets_mean": 3182.8,
"valid_targets_min": 1825
},
{
"epoch": 2.6941362916006337,
"grad_norm": 0.6412851439845717,
"learning_rate": 3.0915969430339285e-05,
"loss": 0.3788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4072532057762146,
"step": 1700,
"valid_targets_mean": 3858.4,
"valid_targets_min": 1152
},
{
"epoch": 2.7020602218700476,
"grad_norm": 0.8200510450598304,
"learning_rate": 3.0849660667113785e-05,
"loss": 0.3806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4585651159286499,
"step": 1705,
"valid_targets_mean": 2658.2,
"valid_targets_min": 949
},
{
"epoch": 2.7099841521394614,
"grad_norm": 0.8199512586359826,
"learning_rate": 3.078318247749009e-05,
"loss": 0.3819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43864548206329346,
"step": 1710,
"valid_targets_mean": 2758.8,
"valid_targets_min": 805
},
{
"epoch": 2.717908082408875,
"grad_norm": 0.7912495090847645,
"learning_rate": 3.0716535899579936e-05,
"loss": 0.3429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3498538136482239,
"step": 1715,
"valid_targets_mean": 2157.8,
"valid_targets_min": 926
},
{
"epoch": 2.7258320126782882,
"grad_norm": 0.5876938155418893,
"learning_rate": 3.0649721974124606e-05,
"loss": 0.3544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32150182127952576,
"step": 1720,
"valid_targets_mean": 3719.1,
"valid_targets_min": 883
},
{
"epoch": 2.733755942947702,
"grad_norm": 0.877583762546389,
"learning_rate": 3.058274174447864e-05,
"loss": 0.3744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39479172229766846,
"step": 1725,
"valid_targets_mean": 2071.7,
"valid_targets_min": 994
},
{
"epoch": 2.741679873217116,
"grad_norm": 0.6592647942561869,
"learning_rate": 3.0515596256593566e-05,
"loss": 0.335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32501962780952454,
"step": 1730,
"valid_targets_mean": 3369.1,
"valid_targets_min": 1144
},
{
"epoch": 2.7496038034865293,
"grad_norm": 0.7657355885140038,
"learning_rate": 3.044828655900153e-05,
"loss": 0.3834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3660418391227722,
"step": 1735,
"valid_targets_mean": 2924.8,
"valid_targets_min": 1083
},
{
"epoch": 2.7575277337559427,
"grad_norm": 0.7593994147389292,
"learning_rate": 3.0380813702798975e-05,
"loss": 0.3765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38318681716918945,
"step": 1740,
"valid_targets_mean": 2862.4,
"valid_targets_min": 923
},
{
"epoch": 2.7654516640253566,
"grad_norm": 0.8032261353715695,
"learning_rate": 3.0313178741630193e-05,
"loss": 0.3775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4111163914203644,
"step": 1745,
"valid_targets_mean": 2419.5,
"valid_targets_min": 845
},
{
"epoch": 2.7733755942947704,
"grad_norm": 0.7917662706861506,
"learning_rate": 3.0245382731670872e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40242886543273926,
"step": 1750,
"valid_targets_mean": 2851.2,
"valid_targets_min": 824
},
{
"epoch": 2.781299524564184,
"grad_norm": 0.6994549455580847,
"learning_rate": 3.017742673161161e-05,
"loss": 0.3694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36322033405303955,
"step": 1755,
"valid_targets_mean": 3588.1,
"valid_targets_min": 680
},
{
"epoch": 2.7892234548335972,
"grad_norm": 0.6902449352365942,
"learning_rate": 3.0109311802641394e-05,
"loss": 0.3745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3887173533439636,
"step": 1760,
"valid_targets_mean": 3538.9,
"valid_targets_min": 1645
},
{
"epoch": 2.797147385103011,
"grad_norm": 0.6572463116289267,
"learning_rate": 3.0041039008431006e-05,
"loss": 0.3456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3245548605918884,
"step": 1765,
"valid_targets_mean": 3434.0,
"valid_targets_min": 1483
},
{
"epoch": 2.805071315372425,
"grad_norm": 0.7520916361470656,
"learning_rate": 2.9972609415116424e-05,
"loss": 0.3595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36480066180229187,
"step": 1770,
"valid_targets_mean": 2674.7,
"valid_targets_min": 1341
},
{
"epoch": 2.8129952456418383,
"grad_norm": 0.7013146155031664,
"learning_rate": 2.990402409128218e-05,
"loss": 0.3546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3468988239765167,
"step": 1775,
"valid_targets_mean": 3095.1,
"valid_targets_min": 1131
},
{
"epoch": 2.8209191759112517,
"grad_norm": 0.8604280966015914,
"learning_rate": 2.983528410794466e-05,
"loss": 0.3695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36563342809677124,
"step": 1780,
"valid_targets_mean": 2494.7,
"valid_targets_min": 875
},
{
"epoch": 2.8288431061806656,
"grad_norm": 0.8186766988561371,
"learning_rate": 2.9766390538535382e-05,
"loss": 0.3649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3959285318851471,
"step": 1785,
"valid_targets_mean": 2253.1,
"valid_targets_min": 907
},
{
"epoch": 2.8367670364500794,
"grad_norm": 0.9075815131643683,
"learning_rate": 2.9697344458884265e-05,
"loss": 0.3545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34358176589012146,
"step": 1790,
"valid_targets_mean": 2338.9,
"valid_targets_min": 1106
},
{
"epoch": 2.844690966719493,
"grad_norm": 0.7043856446767114,
"learning_rate": 2.9628146947202756e-05,
"loss": 0.365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.354300856590271,
"step": 1795,
"valid_targets_mean": 3277.2,
"valid_targets_min": 1262
},
{
"epoch": 2.8526148969889062,
"grad_norm": 0.7370078841642661,
"learning_rate": 2.9558799084067074e-05,
"loss": 0.3718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38159167766571045,
"step": 1800,
"valid_targets_mean": 2703.7,
"valid_targets_min": 1027
},
{
"epoch": 2.86053882725832,
"grad_norm": 0.6990022019648595,
"learning_rate": 2.9489301952401286e-05,
"loss": 0.3522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3276500403881073,
"step": 1805,
"valid_targets_mean": 3995.8,
"valid_targets_min": 675
},
{
"epoch": 2.868462757527734,
"grad_norm": 0.6638533677079017,
"learning_rate": 2.9419656637460413e-05,
"loss": 0.3624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3156994581222534,
"step": 1810,
"valid_targets_mean": 3012.8,
"valid_targets_min": 699
},
{
"epoch": 2.8763866877971473,
"grad_norm": 0.650719515262378,
"learning_rate": 2.9349864226813475e-05,
"loss": 0.3402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3329174518585205,
"step": 1815,
"valid_targets_mean": 3597.6,
"valid_targets_min": 1418
},
{
"epoch": 2.8843106180665607,
"grad_norm": 0.7687174401357069,
"learning_rate": 2.9279925810326516e-05,
"loss": 0.343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37216711044311523,
"step": 1820,
"valid_targets_mean": 3317.2,
"valid_targets_min": 1141
},
{
"epoch": 2.8922345483359746,
"grad_norm": 0.6216599334752763,
"learning_rate": 2.9209842480145587e-05,
"loss": 0.359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3306935429573059,
"step": 1825,
"valid_targets_mean": 3728.8,
"valid_targets_min": 1048
},
{
"epoch": 2.9001584786053884,
"grad_norm": 0.7206089378146915,
"learning_rate": 2.913961533067968e-05,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34333550930023193,
"step": 1830,
"valid_targets_mean": 3466.3,
"valid_targets_min": 1167
},
{
"epoch": 2.908082408874802,
"grad_norm": 0.7578107255518666,
"learning_rate": 2.906924545858364e-05,
"loss": 0.371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3424595296382904,
"step": 1835,
"valid_targets_mean": 2490.8,
"valid_targets_min": 805
},
{
"epoch": 2.9160063391442153,
"grad_norm": 0.7453104444181963,
"learning_rate": 2.8998733962741057e-05,
"loss": 0.3613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3626144528388977,
"step": 1840,
"valid_targets_mean": 2894.9,
"valid_targets_min": 1095
},
{
"epoch": 2.923930269413629,
"grad_norm": 0.7718015723542487,
"learning_rate": 2.8928081944247088e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3860081732273102,
"step": 1845,
"valid_targets_mean": 3889.6,
"valid_targets_min": 823
},
{
"epoch": 2.931854199683043,
"grad_norm": 0.7045879397030554,
"learning_rate": 2.8857290506391243e-05,
"loss": 0.3724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36101579666137695,
"step": 1850,
"valid_targets_mean": 2874.3,
"valid_targets_min": 1195
},
{
"epoch": 2.9397781299524564,
"grad_norm": 0.717984417244567,
"learning_rate": 2.8786360754640213e-05,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34760263562202454,
"step": 1855,
"valid_targets_mean": 2920.6,
"valid_targets_min": 1236
},
{
"epoch": 2.94770206022187,
"grad_norm": 0.6640139889083639,
"learning_rate": 2.8715293796620565e-05,
"loss": 0.3623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4223308265209198,
"step": 1860,
"valid_targets_mean": 3860.2,
"valid_targets_min": 1403
},
{
"epoch": 2.9556259904912836,
"grad_norm": 0.6392198399783302,
"learning_rate": 2.8644090742101444e-05,
"loss": 0.3495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32980644702911377,
"step": 1865,
"valid_targets_mean": 3921.6,
"valid_targets_min": 1156
},
{
"epoch": 2.9635499207606975,
"grad_norm": 0.6870381101356648,
"learning_rate": 2.8572752702977265e-05,
"loss": 0.3692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3842689096927643,
"step": 1870,
"valid_targets_mean": 3652.7,
"valid_targets_min": 1219
},
{
"epoch": 2.971473851030111,
"grad_norm": 0.8762796489016127,
"learning_rate": 2.8501280793250343e-05,
"loss": 0.3851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41141873598098755,
"step": 1875,
"valid_targets_mean": 2225.3,
"valid_targets_min": 1208
},
{
"epoch": 2.9793977812995247,
"grad_norm": 0.8115620338836479,
"learning_rate": 2.8429676129013476e-05,
"loss": 0.3629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3620631694793701,
"step": 1880,
"valid_targets_mean": 2161.6,
"valid_targets_min": 850
},
{
"epoch": 2.987321711568938,
"grad_norm": 0.7750980053703787,
"learning_rate": 2.835793982843255e-05,
"loss": 0.3818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.373153418302536,
"step": 1885,
"valid_targets_mean": 2862.1,
"valid_targets_min": 967
},
{
"epoch": 2.995245641838352,
"grad_norm": 0.7322316673204433,
"learning_rate": 2.8286073011729044e-05,
"loss": 0.3654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3833129405975342,
"step": 1890,
"valid_targets_mean": 3081.8,
"valid_targets_min": 1661
},
{
"epoch": 3.0031695721077654,
"grad_norm": 0.6065227488494328,
"learning_rate": 2.8214076801162575e-05,
"loss": 0.3712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34482842683792114,
"step": 1895,
"valid_targets_mean": 3981.5,
"valid_targets_min": 1418
},
{
"epoch": 3.011093502377179,
"grad_norm": 0.6901979613206464,
"learning_rate": 2.814195232101334e-05,
"loss": 0.3455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35832148790359497,
"step": 1900,
"valid_targets_mean": 3975.4,
"valid_targets_min": 1122
},
{
"epoch": 3.0190174326465926,
"grad_norm": 0.7186510353720049,
"learning_rate": 2.806970069756456e-05,
"loss": 0.3123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30415624380111694,
"step": 1905,
"valid_targets_mean": 3198.1,
"valid_targets_min": 957
},
{
"epoch": 3.0269413629160065,
"grad_norm": 0.6882830013798815,
"learning_rate": 2.7997323059084926e-05,
"loss": 0.331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30928438901901245,
"step": 1910,
"valid_targets_mean": 3419.6,
"valid_targets_min": 1590
},
{
"epoch": 3.03486529318542,
"grad_norm": 0.7774880183981414,
"learning_rate": 2.7924820535810947e-05,
"loss": 0.3444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3439940810203552,
"step": 1915,
"valid_targets_mean": 2875.5,
"valid_targets_min": 742
},
{
"epoch": 3.0427892234548337,
"grad_norm": 0.7838015454420495,
"learning_rate": 2.7852194259929306e-05,
"loss": 0.3104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3384024500846863,
"step": 1920,
"valid_targets_mean": 3003.9,
"valid_targets_min": 988
},
{
"epoch": 3.050713153724247,
"grad_norm": 0.7416290199481121,
"learning_rate": 2.7779445365559196e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35700756311416626,
"step": 1925,
"valid_targets_mean": 3207.6,
"valid_targets_min": 987
},
{
"epoch": 3.058637083993661,
"grad_norm": 0.7414194431448803,
"learning_rate": 2.7706574988734596e-05,
"loss": 0.3458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35844355821609497,
"step": 1930,
"valid_targets_mean": 3496.2,
"valid_targets_min": 1326
},
{
"epoch": 3.0665610142630744,
"grad_norm": 0.7113811917186736,
"learning_rate": 2.7633584267386518e-05,
"loss": 0.3272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29518628120422363,
"step": 1935,
"valid_targets_mean": 3124.2,
"valid_targets_min": 680
},
{
"epoch": 3.074484944532488,
"grad_norm": 0.8314704271197847,
"learning_rate": 2.7560474341325276e-05,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3693086504936218,
"step": 1940,
"valid_targets_mean": 2553.4,
"valid_targets_min": 956
},
{
"epoch": 3.0824088748019016,
"grad_norm": 0.7863210609659544,
"learning_rate": 2.7487246352222648e-05,
"loss": 0.3264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29878532886505127,
"step": 1945,
"valid_targets_mean": 2444.7,
"valid_targets_min": 672
},
{
"epoch": 3.0903328050713155,
"grad_norm": 0.7257330134496905,
"learning_rate": 2.7413901443594073e-05,
"loss": 0.3155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30191296339035034,
"step": 1950,
"valid_targets_mean": 3476.1,
"valid_targets_min": 1206
},
{
"epoch": 3.098256735340729,
"grad_norm": 0.8065297599365323,
"learning_rate": 2.7340440760780778e-05,
"loss": 0.3474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32383155822753906,
"step": 1955,
"valid_targets_mean": 2889.2,
"valid_targets_min": 929
},
{
"epoch": 3.1061806656101427,
"grad_norm": 0.712007666432261,
"learning_rate": 2.7266865450931907e-05,
"loss": 0.3263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3361831307411194,
"step": 1960,
"valid_targets_mean": 3199.6,
"valid_targets_min": 1270
},
{
"epoch": 3.114104595879556,
"grad_norm": 0.7794712083869874,
"learning_rate": 2.7193176662986593e-05,
"loss": 0.333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3365066647529602,
"step": 1965,
"valid_targets_mean": 2549.4,
"valid_targets_min": 989
},
{
"epoch": 3.12202852614897,
"grad_norm": 0.8498632060188069,
"learning_rate": 2.7119375547656025e-05,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34931614995002747,
"step": 1970,
"valid_targets_mean": 2771.6,
"valid_targets_min": 1096
},
{
"epoch": 3.1299524564183834,
"grad_norm": 0.7075486291042362,
"learning_rate": 2.704546325740548e-05,
"loss": 0.3357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31514453887939453,
"step": 1975,
"valid_targets_mean": 3283.4,
"valid_targets_min": 904
},
{
"epoch": 3.1378763866877972,
"grad_norm": 0.8262903637467062,
"learning_rate": 2.6971440946436306e-05,
"loss": 0.333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3372984528541565,
"step": 1980,
"valid_targets_mean": 2639.2,
"valid_targets_min": 1053
},
{
"epoch": 3.1458003169572106,
"grad_norm": 0.6978216538446294,
"learning_rate": 2.689730977066795e-05,
"loss": 0.3226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3109763264656067,
"step": 1985,
"valid_targets_mean": 3200.6,
"valid_targets_min": 860
},
{
"epoch": 3.1537242472266245,
"grad_norm": 0.740783802930712,
"learning_rate": 2.682307088771984e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35412776470184326,
"step": 1990,
"valid_targets_mean": 3045.1,
"valid_targets_min": 998
},
{
"epoch": 3.161648177496038,
"grad_norm": 0.8656214600333869,
"learning_rate": 2.6748725456893355e-05,
"loss": 0.3307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32956281304359436,
"step": 1995,
"valid_targets_mean": 2030.4,
"valid_targets_min": 968
},
{
"epoch": 3.1695721077654517,
"grad_norm": 0.7377230964997741,
"learning_rate": 2.66742746391537e-05,
"loss": 0.3513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3444298505783081,
"step": 2000,
"valid_targets_mean": 3455.4,
"valid_targets_min": 1280
},
{
"epoch": 3.177496038034865,
"grad_norm": 0.7541796485264278,
"learning_rate": 2.6599719597111794e-05,
"loss": 0.3545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3887772560119629,
"step": 2005,
"valid_targets_mean": 3408.1,
"valid_targets_min": 1341
},
{
"epoch": 3.185419968304279,
"grad_norm": 0.7815456449009791,
"learning_rate": 2.6525061495006103e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3660275936126709,
"step": 2010,
"valid_targets_mean": 3231.4,
"valid_targets_min": 1124
},
{
"epoch": 3.1933438985736924,
"grad_norm": 0.6900245267272553,
"learning_rate": 2.6450301498684443e-05,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34687238931655884,
"step": 2015,
"valid_targets_mean": 3574.1,
"valid_targets_min": 1302
},
{
"epoch": 3.2012678288431062,
"grad_norm": 0.7549001056433992,
"learning_rate": 2.637544077558581e-05,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3526916205883026,
"step": 2020,
"valid_targets_mean": 3198.1,
"valid_targets_min": 1741
},
{
"epoch": 3.2091917591125196,
"grad_norm": 0.7851430991597503,
"learning_rate": 2.630048049472213e-05,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3379470705986023,
"step": 2025,
"valid_targets_mean": 2515.5,
"valid_targets_min": 323
},
{
"epoch": 3.2171156893819335,
"grad_norm": 0.7004928403794375,
"learning_rate": 2.622542182666e-05,
"loss": 0.3213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32637515664100647,
"step": 2030,
"valid_targets_mean": 3517.1,
"valid_targets_min": 1042
},
{
"epoch": 3.225039619651347,
"grad_norm": 0.7764554104098883,
"learning_rate": 2.6150265943502424e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3583545684814453,
"step": 2035,
"valid_targets_mean": 2765.4,
"valid_targets_min": 881
},
{
"epoch": 3.2329635499207607,
"grad_norm": 0.6465157812209109,
"learning_rate": 2.6075014018870483e-05,
"loss": 0.3167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3526315689086914,
"step": 2040,
"valid_targets_mean": 4235.4,
"valid_targets_min": 1086
},
{
"epoch": 3.240887480190174,
"grad_norm": 0.706625007326448,
"learning_rate": 2.599966722788504e-05,
"loss": 0.3069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2997731566429138,
"step": 2045,
"valid_targets_mean": 3172.4,
"valid_targets_min": 1201
},
{
"epoch": 3.248811410459588,
"grad_norm": 0.7850578365104528,
"learning_rate": 2.5924226747148372e-05,
"loss": 0.3402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30590397119522095,
"step": 2050,
"valid_targets_mean": 2757.9,
"valid_targets_min": 1061
},
{
"epoch": 3.2567353407290014,
"grad_norm": 0.6518087609710441,
"learning_rate": 2.584869375472579e-05,
"loss": 0.3183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29854464530944824,
"step": 2055,
"valid_targets_mean": 3279.2,
"valid_targets_min": 1107
},
{
"epoch": 3.2646592709984152,
"grad_norm": 0.822500398616075,
"learning_rate": 2.577306943012725e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34053948521614075,
"step": 2060,
"valid_targets_mean": 2633.9,
"valid_targets_min": 1317
},
{
"epoch": 3.272583201267829,
"grad_norm": 0.8125115262492077,
"learning_rate": 2.569735495428896e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32668331265449524,
"step": 2065,
"valid_targets_mean": 2618.7,
"valid_targets_min": 786
},
{
"epoch": 3.2805071315372425,
"grad_norm": 1.4959208602319205,
"learning_rate": 2.562155150955488e-05,
"loss": 0.3161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3204629421234131,
"step": 2070,
"valid_targets_mean": 2665.9,
"valid_targets_min": 1262
},
{
"epoch": 3.288431061806656,
"grad_norm": 0.611048992859609,
"learning_rate": 2.554566027965832e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2836368680000305,
"step": 2075,
"valid_targets_mean": 4082.5,
"valid_targets_min": 1157
},
{
"epoch": 3.2963549920760697,
"grad_norm": 0.7774858963866713,
"learning_rate": 2.5469682449703414e-05,
"loss": 0.3378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3361954689025879,
"step": 2080,
"valid_targets_mean": 2990.8,
"valid_targets_min": 644
},
{
"epoch": 3.3042789223454836,
"grad_norm": 0.8182618562206451,
"learning_rate": 2.539361920614662e-05,
"loss": 0.3471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3528863191604614,
"step": 2085,
"valid_targets_mean": 2776.4,
"valid_targets_min": 1167
},
{
"epoch": 3.312202852614897,
"grad_norm": 0.7286378347810851,
"learning_rate": 2.5317471736778226e-05,
"loss": 0.3348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3281998038291931,
"step": 2090,
"valid_targets_mean": 3044.1,
"valid_targets_min": 592
},
{
"epoch": 3.3201267828843104,
"grad_norm": 0.5916476860001847,
"learning_rate": 2.524124123070375e-05,
"loss": 0.318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27134382724761963,
"step": 2095,
"valid_targets_mean": 4022.4,
"valid_targets_min": 836
},
{
"epoch": 3.3280507131537242,
"grad_norm": 0.8344841361605951,
"learning_rate": 2.5164928878325404e-05,
"loss": 0.3251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33823129534721375,
"step": 2100,
"valid_targets_mean": 2500.5,
"valid_targets_min": 1030
},
{
"epoch": 3.335974643423138,
"grad_norm": 0.7080563566881553,
"learning_rate": 2.5088535871323502e-05,
"loss": 0.3245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3264184594154358,
"step": 2105,
"valid_targets_mean": 3250.5,
"valid_targets_min": 1023
},
{
"epoch": 3.3438985736925515,
"grad_norm": 0.7908723696589502,
"learning_rate": 2.5012063402637843e-05,
"loss": 0.3421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35519134998321533,
"step": 2110,
"valid_targets_mean": 2987.3,
"valid_targets_min": 1241
},
{
"epoch": 3.351822503961965,
"grad_norm": 0.70839207204405,
"learning_rate": 2.4935512666449085e-05,
"loss": 0.3188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31166577339172363,
"step": 2115,
"valid_targets_mean": 3060.3,
"valid_targets_min": 746
},
{
"epoch": 3.3597464342313788,
"grad_norm": 0.7933084485897915,
"learning_rate": 2.4858884858160107e-05,
"loss": 0.3242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3538547158241272,
"step": 2120,
"valid_targets_mean": 3038.3,
"valid_targets_min": 1106
},
{
"epoch": 3.3676703645007926,
"grad_norm": 0.7663074843622576,
"learning_rate": 2.4782181174377314e-05,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.352549284696579,
"step": 2125,
"valid_targets_mean": 3099.4,
"valid_targets_min": 1095
},
{
"epoch": 3.375594294770206,
"grad_norm": 0.7138476967374972,
"learning_rate": 2.470540281289199e-05,
"loss": 0.3422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33138760924339294,
"step": 2130,
"valid_targets_mean": 2867.1,
"valid_targets_min": 1311
},
{
"epoch": 3.3835182250396194,
"grad_norm": 0.6633701832610104,
"learning_rate": 2.4628550972661557e-05,
"loss": 0.324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30286821722984314,
"step": 2135,
"valid_targets_mean": 3736.6,
"valid_targets_min": 1535
},
{
"epoch": 3.3914421553090333,
"grad_norm": 0.7181119752621806,
"learning_rate": 2.455162685379087e-05,
"loss": 0.3212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3247692286968231,
"step": 2140,
"valid_targets_mean": 3933.5,
"valid_targets_min": 1455
},
{
"epoch": 3.399366085578447,
"grad_norm": 0.58939690424488,
"learning_rate": 2.447463165751349e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28043270111083984,
"step": 2145,
"valid_targets_mean": 4510.4,
"valid_targets_min": 1619
},
{
"epoch": 3.4072900158478605,
"grad_norm": 0.6905860534611378,
"learning_rate": 2.4397566586172883e-05,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31197258830070496,
"step": 2150,
"valid_targets_mean": 3251.9,
"valid_targets_min": 1084
},
{
"epoch": 3.4152139461172744,
"grad_norm": 0.7543811037179319,
"learning_rate": 2.4320432843203704e-05,
"loss": 0.3337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33104807138442993,
"step": 2155,
"valid_targets_mean": 2821.9,
"valid_targets_min": 1396
},
{
"epoch": 3.4231378763866878,
"grad_norm": 0.7618177630066788,
"learning_rate": 2.4243231633112943e-05,
"loss": 0.3461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33463001251220703,
"step": 2160,
"valid_targets_mean": 3083.6,
"valid_targets_min": 1252
},
{
"epoch": 3.4310618066561016,
"grad_norm": 0.7273682305306333,
"learning_rate": 2.4165964161461167e-05,
"loss": 0.3177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34640154242515564,
"step": 2165,
"valid_targets_mean": 3702.2,
"valid_targets_min": 1381
},
{
"epoch": 3.438985736925515,
"grad_norm": 0.6923581076598425,
"learning_rate": 2.408863163484366e-05,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33265140652656555,
"step": 2170,
"valid_targets_mean": 3575.5,
"valid_targets_min": 605
},
{
"epoch": 3.446909667194929,
"grad_norm": 0.7329934998169874,
"learning_rate": 2.401123526087159e-05,
"loss": 0.319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3211047947406769,
"step": 2175,
"valid_targets_mean": 3020.9,
"valid_targets_min": 1398
},
{
"epoch": 3.4548335974643423,
"grad_norm": 0.6822054946764609,
"learning_rate": 2.3933776248153168e-05,
"loss": 0.3332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3279761075973511,
"step": 2180,
"valid_targets_mean": 3455.0,
"valid_targets_min": 1277
},
{
"epoch": 3.462757527733756,
"grad_norm": 0.6616693352625908,
"learning_rate": 2.385625580627474e-05,
"loss": 0.3282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3381684124469757,
"step": 2185,
"valid_targets_mean": 3872.2,
"valid_targets_min": 1192
},
{
"epoch": 3.4706814580031695,
"grad_norm": 0.7741372802839244,
"learning_rate": 2.377867514578194e-05,
"loss": 0.3361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3979116678237915,
"step": 2190,
"valid_targets_mean": 3336.3,
"valid_targets_min": 997
},
{
"epoch": 3.4786053882725834,
"grad_norm": 0.7070236701033044,
"learning_rate": 2.3701035478160763e-05,
"loss": 0.349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35837632417678833,
"step": 2195,
"valid_targets_mean": 3782.2,
"valid_targets_min": 1485
},
{
"epoch": 3.4865293185419968,
"grad_norm": 0.7494594936521863,
"learning_rate": 2.3623338015818623e-05,
"loss": 0.3357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3438400626182556,
"step": 2200,
"valid_targets_mean": 2959.6,
"valid_targets_min": 663
},
{
"epoch": 3.4944532488114106,
"grad_norm": 0.6937608768005562,
"learning_rate": 2.3545583972065484e-05,
"loss": 0.3342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3017534911632538,
"step": 2205,
"valid_targets_mean": 3185.6,
"valid_targets_min": 900
},
{
"epoch": 3.502377179080824,
"grad_norm": 0.6888295505753116,
"learning_rate": 2.346777456109485e-05,
"loss": 0.3277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26715266704559326,
"step": 2210,
"valid_targets_mean": 2821.8,
"valid_targets_min": 944
},
{
"epoch": 3.510301109350238,
"grad_norm": 0.7118241028505115,
"learning_rate": 2.3389910997964832e-05,
"loss": 0.3335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3349294066429138,
"step": 2215,
"valid_targets_mean": 3142.1,
"valid_targets_min": 1146
},
{
"epoch": 3.5182250396196513,
"grad_norm": 0.7278682132311887,
"learning_rate": 2.3311994498579185e-05,
"loss": 0.331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29668980836868286,
"step": 2220,
"valid_targets_mean": 3287.6,
"valid_targets_min": 1218
},
{
"epoch": 3.526148969889065,
"grad_norm": 0.6941142765146813,
"learning_rate": 2.3234026279668296e-05,
"loss": 0.3326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3018149733543396,
"step": 2225,
"valid_targets_mean": 3132.2,
"valid_targets_min": 852
},
{
"epoch": 3.5340729001584785,
"grad_norm": 0.740242823338274,
"learning_rate": 2.3156007558770192e-05,
"loss": 0.3254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31529009342193604,
"step": 2230,
"valid_targets_mean": 2922.2,
"valid_targets_min": 1057
},
{
"epoch": 3.5419968304278924,
"grad_norm": 0.8523972449816457,
"learning_rate": 2.307793955421154e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3462240397930145,
"step": 2235,
"valid_targets_mean": 2572.6,
"valid_targets_min": 951
},
{
"epoch": 3.5499207606973058,
"grad_norm": 0.7990562745382495,
"learning_rate": 2.299982348508861e-05,
"loss": 0.3536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3121604025363922,
"step": 2240,
"valid_targets_mean": 2908.9,
"valid_targets_min": 1118
},
{
"epoch": 3.5578446909667196,
"grad_norm": 0.6945315665088014,
"learning_rate": 2.2921660571248237e-05,
"loss": 0.3353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33167335391044617,
"step": 2245,
"valid_targets_mean": 3621.6,
"valid_targets_min": 881
},
{
"epoch": 3.565768621236133,
"grad_norm": 0.6731796035427767,
"learning_rate": 2.2843452033268775e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30071955919265747,
"step": 2250,
"valid_targets_mean": 3450.9,
"valid_targets_min": 1051
},
{
"epoch": 3.573692551505547,
"grad_norm": 0.8546792122499989,
"learning_rate": 2.2765199092441033e-05,
"loss": 0.3335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39534080028533936,
"step": 2255,
"valid_targets_mean": 2804.2,
"valid_targets_min": 1371
},
{
"epoch": 3.5816164817749603,
"grad_norm": 0.8037548712670296,
"learning_rate": 2.2686902970749218e-05,
"loss": 0.3326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.354625940322876,
"step": 2260,
"valid_targets_mean": 2839.2,
"valid_targets_min": 1273
},
{
"epoch": 3.589540412044374,
"grad_norm": 0.7463842550414609,
"learning_rate": 2.260856489085183e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3454499840736389,
"step": 2265,
"valid_targets_mean": 2875.6,
"valid_targets_min": 1522
},
{
"epoch": 3.5974643423137875,
"grad_norm": 0.7214338181235017,
"learning_rate": 2.2530186076062588e-05,
"loss": 0.3408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32981571555137634,
"step": 2270,
"valid_targets_mean": 3369.8,
"valid_targets_min": 1324
},
{
"epoch": 3.6053882725832014,
"grad_norm": 0.7266954380266903,
"learning_rate": 2.2451767750331316e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3404169976711273,
"step": 2275,
"valid_targets_mean": 3491.8,
"valid_targets_min": 1001
},
{
"epoch": 3.613312202852615,
"grad_norm": 0.7418997208137097,
"learning_rate": 2.2373311138224838e-05,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31640252470970154,
"step": 2280,
"valid_targets_mean": 2498.8,
"valid_targets_min": 901
},
{
"epoch": 3.6212361331220286,
"grad_norm": 0.7680111061901961,
"learning_rate": 2.2294817464907852e-05,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3239263594150543,
"step": 2285,
"valid_targets_mean": 2514.9,
"valid_targets_min": 1517
},
{
"epoch": 3.629160063391442,
"grad_norm": 0.6982918820606155,
"learning_rate": 2.221628795612379e-05,
"loss": 0.3313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32979482412338257,
"step": 2290,
"valid_targets_mean": 3441.3,
"valid_targets_min": 1224
},
{
"epoch": 3.637083993660856,
"grad_norm": 0.7261379689885271,
"learning_rate": 2.2137723838175693e-05,
"loss": 0.319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3410705327987671,
"step": 2295,
"valid_targets_mean": 2833.8,
"valid_targets_min": 1138
},
{
"epoch": 3.6450079239302693,
"grad_norm": 0.7535963960315106,
"learning_rate": 2.205912633790704e-05,
"loss": 0.3461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.323788583278656,
"step": 2300,
"valid_targets_mean": 2891.2,
"valid_targets_min": 1241
},
{
"epoch": 3.652931854199683,
"grad_norm": 0.6969204879397259,
"learning_rate": 2.198049668268262e-05,
"loss": 0.3284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3207600712776184,
"step": 2305,
"valid_targets_mean": 3219.8,
"valid_targets_min": 1444
},
{
"epoch": 3.6608557844690965,
"grad_norm": 0.887306839014218,
"learning_rate": 2.1901836100369335e-05,
"loss": 0.3317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33578261733055115,
"step": 2310,
"valid_targets_mean": 2205.1,
"valid_targets_min": 906
},
{
"epoch": 3.6687797147385104,
"grad_norm": 0.9750572459180453,
"learning_rate": 2.1823145819317048e-05,
"loss": 0.3365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35123610496520996,
"step": 2315,
"valid_targets_mean": 2695.4,
"valid_targets_min": 1084
},
{
"epoch": 3.676703645007924,
"grad_norm": 0.7780709496343529,
"learning_rate": 2.174442706833938e-05,
"loss": 0.3361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3519875109195709,
"step": 2320,
"valid_targets_mean": 2882.0,
"valid_targets_min": 807
},
{
"epoch": 3.6846275752773376,
"grad_norm": 0.7243496238272615,
"learning_rate": 2.1665681076694544e-05,
"loss": 0.3247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31398969888687134,
"step": 2325,
"valid_targets_mean": 2690.4,
"valid_targets_min": 732
},
{
"epoch": 3.692551505546751,
"grad_norm": 0.7526736641692691,
"learning_rate": 2.1586909074066136e-05,
"loss": 0.3462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34414851665496826,
"step": 2330,
"valid_targets_mean": 3210.9,
"valid_targets_min": 1143
},
{
"epoch": 3.700475435816165,
"grad_norm": 0.7452110101075897,
"learning_rate": 2.1508112290543933e-05,
"loss": 0.3447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3227662742137909,
"step": 2335,
"valid_targets_mean": 3213.6,
"valid_targets_min": 1032
},
{
"epoch": 3.7083993660855783,
"grad_norm": 0.7854460633468776,
"learning_rate": 2.142929195660469e-05,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34010860323905945,
"step": 2340,
"valid_targets_mean": 2676.4,
"valid_targets_min": 933
},
{
"epoch": 3.716323296354992,
"grad_norm": 0.6656721032192763,
"learning_rate": 2.1350449303092917e-05,
"loss": 0.3187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29363691806793213,
"step": 2345,
"valid_targets_mean": 3574.9,
"valid_targets_min": 1262
},
{
"epoch": 3.7242472266244055,
"grad_norm": 0.7337377728820911,
"learning_rate": 2.1271585561201666e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4165416359901428,
"step": 2350,
"valid_targets_mean": 3303.0,
"valid_targets_min": 1199
},
{
"epoch": 3.7321711568938194,
"grad_norm": 0.6641092113281405,
"learning_rate": 2.1192701962453296e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30195552110671997,
"step": 2355,
"valid_targets_mean": 3354.2,
"valid_targets_min": 916
},
{
"epoch": 3.740095087163233,
"grad_norm": 0.5875766220259515,
"learning_rate": 2.1113799738680254e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31163403391838074,
"step": 2360,
"valid_targets_mean": 4143.1,
"valid_targets_min": 1838
},
{
"epoch": 3.7480190174326466,
"grad_norm": 0.717473872317517,
"learning_rate": 2.103488012200583e-05,
"loss": 0.3333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35403263568878174,
"step": 2365,
"valid_targets_mean": 3673.4,
"valid_targets_min": 1188
},
{
"epoch": 3.75594294770206,
"grad_norm": 0.7708312139810358,
"learning_rate": 2.095594434482491e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33274000883102417,
"step": 2370,
"valid_targets_mean": 3095.4,
"valid_targets_min": 1461
},
{
"epoch": 3.763866877971474,
"grad_norm": 0.6215656666692516,
"learning_rate": 2.0876993639784752e-05,
"loss": 0.3578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3734382092952728,
"step": 2375,
"valid_targets_mean": 4395.7,
"valid_targets_min": 1069
},
{
"epoch": 3.7717908082408877,
"grad_norm": 0.696852480633942,
"learning_rate": 2.0798029239765722e-05,
"loss": 0.3409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31851282715797424,
"step": 2380,
"valid_targets_mean": 3874.2,
"valid_targets_min": 1802
},
{
"epoch": 3.779714738510301,
"grad_norm": 0.6951396595704138,
"learning_rate": 2.0719052377862033e-05,
"loss": 0.3278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32077187299728394,
"step": 2385,
"valid_targets_mean": 3521.0,
"valid_targets_min": 1390
},
{
"epoch": 3.7876386687797146,
"grad_norm": 0.7195020532275461,
"learning_rate": 2.0640064287362525e-05,
"loss": 0.326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3314870297908783,
"step": 2390,
"valid_targets_mean": 3229.4,
"valid_targets_min": 1289
},
{
"epoch": 3.7955625990491284,
"grad_norm": 0.8180751679396766,
"learning_rate": 2.056106620173135e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3853730857372284,
"step": 2395,
"valid_targets_mean": 2613.6,
"valid_targets_min": 1336
},
{
"epoch": 3.8034865293185423,
"grad_norm": 0.733730511080735,
"learning_rate": 2.048205935458877e-05,
"loss": 0.326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32132023572921753,
"step": 2400,
"valid_targets_mean": 3179.6,
"valid_targets_min": 1221
},
{
"epoch": 3.8114104595879557,
"grad_norm": 0.6134570576672795,
"learning_rate": 2.0403044979691854e-05,
"loss": 0.3082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28578662872314453,
"step": 2405,
"valid_targets_mean": 3837.6,
"valid_targets_min": 1304
},
{
"epoch": 3.819334389857369,
"grad_norm": 0.7635018637295181,
"learning_rate": 2.032402431091522e-05,
"loss": 0.3451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31944137811660767,
"step": 2410,
"valid_targets_mean": 2599.2,
"valid_targets_min": 1296
},
{
"epoch": 3.827258320126783,
"grad_norm": 0.7372264488783937,
"learning_rate": 2.0244998582231767e-05,
"loss": 0.3408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3162527084350586,
"step": 2415,
"valid_targets_mean": 2805.4,
"valid_targets_min": 1464
},
{
"epoch": 3.8351822503961968,
"grad_norm": 0.6531551753056782,
"learning_rate": 2.0165969027693425e-05,
"loss": 0.3353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3599008321762085,
"step": 2420,
"valid_targets_mean": 4002.8,
"valid_targets_min": 1494
},
{
"epoch": 3.84310618066561,
"grad_norm": 0.8353501525186963,
"learning_rate": 2.008693688141185e-05,
"loss": 0.3313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3477362394332886,
"step": 2425,
"valid_targets_mean": 2357.6,
"valid_targets_min": 919
},
{
"epoch": 3.8510301109350236,
"grad_norm": 0.7088029576862485,
"learning_rate": 2.0007903377539187e-05,
"loss": 0.3171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28312909603118896,
"step": 2430,
"valid_targets_mean": 3164.1,
"valid_targets_min": 1362
},
{
"epoch": 3.8589540412044374,
"grad_norm": 0.7274010885836312,
"learning_rate": 1.992886975024876e-05,
"loss": 0.337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31846240162849426,
"step": 2435,
"valid_targets_mean": 3024.1,
"valid_targets_min": 889
},
{
"epoch": 3.8668779714738513,
"grad_norm": 0.7833894784900323,
"learning_rate": 1.984983723371584e-05,
"loss": 0.3328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3632742762565613,
"step": 2440,
"valid_targets_mean": 2629.2,
"valid_targets_min": 558
},
{
"epoch": 3.8748019017432647,
"grad_norm": 0.6668796876085389,
"learning_rate": 1.977080706209835e-05,
"loss": 0.3311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34540417790412903,
"step": 2445,
"valid_targets_mean": 3503.6,
"valid_targets_min": 1173
},
{
"epoch": 3.882725832012678,
"grad_norm": 0.7198481169885637,
"learning_rate": 1.9691780469517578e-05,
"loss": 0.3263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3147124648094177,
"step": 2450,
"valid_targets_mean": 3361.3,
"valid_targets_min": 1502
},
{
"epoch": 3.890649762282092,
"grad_norm": 0.6225664648803466,
"learning_rate": 1.961275869003894e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.299946129322052,
"step": 2455,
"valid_targets_mean": 4080.0,
"valid_targets_min": 1743
},
{
"epoch": 3.8985736925515058,
"grad_norm": 0.586811491312213,
"learning_rate": 1.9533742957652683e-05,
"loss": 0.3253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30612677335739136,
"step": 2460,
"valid_targets_mean": 3907.0,
"valid_targets_min": 1502
},
{
"epoch": 3.906497622820919,
"grad_norm": 0.8015375291847339,
"learning_rate": 1.945473450625463e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3285152316093445,
"step": 2465,
"valid_targets_mean": 2799.4,
"valid_targets_min": 1124
},
{
"epoch": 3.9144215530903326,
"grad_norm": 0.7768068569253016,
"learning_rate": 1.9375734569626904e-05,
"loss": 0.3243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32465943694114685,
"step": 2470,
"valid_targets_mean": 2695.1,
"valid_targets_min": 1188
},
{
"epoch": 3.9223454833597464,
"grad_norm": 0.6903149189834576,
"learning_rate": 1.9296744381418653e-05,
"loss": 0.3309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3335050344467163,
"step": 2475,
"valid_targets_mean": 3702.8,
"valid_targets_min": 1403
},
{
"epoch": 3.9302694136291603,
"grad_norm": 0.674427230152727,
"learning_rate": 1.9217765175126808e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34546995162963867,
"step": 2480,
"valid_targets_mean": 3681.2,
"valid_targets_min": 1344
},
{
"epoch": 3.9381933438985737,
"grad_norm": 0.7615168910152336,
"learning_rate": 1.9138798184076805e-05,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3379887342453003,
"step": 2485,
"valid_targets_mean": 2786.8,
"valid_targets_min": 665
},
{
"epoch": 3.946117274167987,
"grad_norm": 0.739627311408071,
"learning_rate": 1.9059844641403323e-05,
"loss": 0.3386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.337485134601593,
"step": 2490,
"valid_targets_mean": 2974.0,
"valid_targets_min": 1066
},
{
"epoch": 3.954041204437401,
"grad_norm": 0.7540616165257731,
"learning_rate": 1.898090578003104e-05,
"loss": 0.3316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3072323203086853,
"step": 2495,
"valid_targets_mean": 2595.8,
"valid_targets_min": 1021
},
{
"epoch": 3.9619651347068148,
"grad_norm": 0.849781819038183,
"learning_rate": 1.890198283265537e-05,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33093464374542236,
"step": 2500,
"valid_targets_mean": 2223.1,
"valid_targets_min": 1112
},
{
"epoch": 3.969889064976228,
"grad_norm": 0.6623254756540252,
"learning_rate": 1.8823077031723217e-05,
"loss": 0.328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32428649067878723,
"step": 2505,
"valid_targets_mean": 3929.8,
"valid_targets_min": 1152
},
{
"epoch": 3.9778129952456416,
"grad_norm": 0.9088875770456144,
"learning_rate": 1.8744189609413733e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3459881544113159,
"step": 2510,
"valid_targets_mean": 2497.1,
"valid_targets_min": 1041
},
{
"epoch": 3.9857369255150554,
"grad_norm": 0.7118244141970165,
"learning_rate": 1.8665321797619068e-05,
"loss": 0.3601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3549520969390869,
"step": 2515,
"valid_targets_mean": 3036.4,
"valid_targets_min": 1036
},
{
"epoch": 3.9936608557844693,
"grad_norm": 0.7872431081558173,
"learning_rate": 1.8586474827925142e-05,
"loss": 0.3399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.343522310256958,
"step": 2520,
"valid_targets_mean": 3111.9,
"valid_targets_min": 934
},
{
"epoch": 4.001584786053883,
"grad_norm": 0.6333163189857594,
"learning_rate": 1.8507649931592405e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30445295572280884,
"step": 2525,
"valid_targets_mean": 3531.7,
"valid_targets_min": 1013
},
{
"epoch": 4.009508716323296,
"grad_norm": 0.6185313213820511,
"learning_rate": 1.8428848339536613e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28447040915489197,
"step": 2530,
"valid_targets_mean": 3920.8,
"valid_targets_min": 965
},
{
"epoch": 4.01743264659271,
"grad_norm": 1.632827555786203,
"learning_rate": 1.8350071282309606e-05,
"loss": 0.306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2971077561378479,
"step": 2535,
"valid_targets_mean": 3930.5,
"valid_targets_min": 1379
},
{
"epoch": 4.025356576862124,
"grad_norm": 0.7394593200985027,
"learning_rate": 1.8271319990080093e-05,
"loss": 0.318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2914736270904541,
"step": 2540,
"valid_targets_mean": 3326.8,
"valid_targets_min": 1293
},
{
"epoch": 4.033280507131537,
"grad_norm": 0.6319798264181055,
"learning_rate": 1.8192595692614445e-05,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2948256731033325,
"step": 2545,
"valid_targets_mean": 4935.4,
"valid_targets_min": 1569
},
{
"epoch": 4.041204437400951,
"grad_norm": 0.6195429750205664,
"learning_rate": 1.8113899619257487e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.259757399559021,
"step": 2550,
"valid_targets_mean": 3946.8,
"valid_targets_min": 1514
},
{
"epoch": 4.049128367670365,
"grad_norm": 0.8136555394477911,
"learning_rate": 1.8035232998913294e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3359217345714569,
"step": 2555,
"valid_targets_mean": 2811.3,
"valid_targets_min": 1053
},
{
"epoch": 4.057052297939778,
"grad_norm": 0.658978371503885,
"learning_rate": 1.795659706002602e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27853959798812866,
"step": 2560,
"valid_targets_mean": 3751.6,
"valid_targets_min": 1163
},
{
"epoch": 4.064976228209192,
"grad_norm": 0.7024991019538495,
"learning_rate": 1.7877993030560693e-05,
"loss": 0.3171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3008027970790863,
"step": 2565,
"valid_targets_mean": 3564.5,
"valid_targets_min": 732
},
{
"epoch": 4.072900158478605,
"grad_norm": 0.9509196576152328,
"learning_rate": 1.7799422137984047e-05,
"loss": 0.3017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3372243642807007,
"step": 2570,
"valid_targets_mean": 2080.0,
"valid_targets_min": 1092
},
{
"epoch": 4.080824088748019,
"grad_norm": 0.8259571384452493,
"learning_rate": 1.772088560924536e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28471559286117554,
"step": 2575,
"valid_targets_mean": 2408.6,
"valid_targets_min": 1083
},
{
"epoch": 4.088748019017433,
"grad_norm": 0.8306440223043661,
"learning_rate": 1.76423846707573e-05,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30105167627334595,
"step": 2580,
"valid_targets_mean": 2728.8,
"valid_targets_min": 1359
},
{
"epoch": 4.096671949286846,
"grad_norm": 0.7821004468315431,
"learning_rate": 1.756392054837675e-05,
"loss": 0.3321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35259807109832764,
"step": 2585,
"valid_targets_mean": 3060.4,
"valid_targets_min": 1256
},
{
"epoch": 4.10459587955626,
"grad_norm": 0.837278260105263,
"learning_rate": 1.7485494467385686e-05,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2958485782146454,
"step": 2590,
"valid_targets_mean": 2570.9,
"valid_targets_min": 1177
},
{
"epoch": 4.112519809825674,
"grad_norm": 0.7450702161875221,
"learning_rate": 1.7407107652472034e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2652340531349182,
"step": 2595,
"valid_targets_mean": 2721.6,
"valid_targets_min": 988
},
{
"epoch": 4.120443740095087,
"grad_norm": 0.8272401230749654,
"learning_rate": 1.7328761327710545e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2961358428001404,
"step": 2600,
"valid_targets_mean": 2593.1,
"valid_targets_min": 1360
},
{
"epoch": 4.128367670364501,
"grad_norm": 1.2748656480073979,
"learning_rate": 1.7250456716543693e-05,
"loss": 0.3267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31461167335510254,
"step": 2605,
"valid_targets_mean": 4279.6,
"valid_targets_min": 1170
},
{
"epoch": 4.136291600633914,
"grad_norm": 0.8167474006377758,
"learning_rate": 1.717219504176255e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3002293109893799,
"step": 2610,
"valid_targets_mean": 2615.6,
"valid_targets_min": 694
},
{
"epoch": 4.144215530903328,
"grad_norm": 0.7453906065684714,
"learning_rate": 1.7093977525487704e-05,
"loss": 0.3187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31392133235931396,
"step": 2615,
"valid_targets_mean": 3305.8,
"valid_targets_min": 824
},
{
"epoch": 4.152139461172742,
"grad_norm": 0.70102708908017,
"learning_rate": 1.701580538915017e-05,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3022012412548065,
"step": 2620,
"valid_targets_mean": 3455.0,
"valid_targets_min": 1731
},
{
"epoch": 4.160063391442155,
"grad_norm": 0.7192692867446561,
"learning_rate": 1.693767985347232e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26913607120513916,
"step": 2625,
"valid_targets_mean": 3015.6,
"valid_targets_min": 968
},
{
"epoch": 4.167987321711569,
"grad_norm": 0.7640141605128163,
"learning_rate": 1.6859602138448822e-05,
"loss": 0.3103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3088947534561157,
"step": 2630,
"valid_targets_mean": 3482.1,
"valid_targets_min": 814
},
{
"epoch": 4.175911251980983,
"grad_norm": 0.8117508775782821,
"learning_rate": 1.6781573463327573e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31718161702156067,
"step": 2635,
"valid_targets_mean": 2880.6,
"valid_targets_min": 1500
},
{
"epoch": 4.183835182250396,
"grad_norm": 0.7420422079275537,
"learning_rate": 1.6703595046590685e-05,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3003275394439697,
"step": 2640,
"valid_targets_mean": 3582.3,
"valid_targets_min": 1096
},
{
"epoch": 4.19175911251981,
"grad_norm": 0.7642707778816153,
"learning_rate": 1.662566810593544e-05,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2956918478012085,
"step": 2645,
"valid_targets_mean": 3331.7,
"valid_targets_min": 1139
},
{
"epoch": 4.199683042789223,
"grad_norm": 0.9108013010532445,
"learning_rate": 1.6547793858255275e-05,
"loss": 0.2901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3331553041934967,
"step": 2650,
"valid_targets_mean": 2406.9,
"valid_targets_min": 737
},
{
"epoch": 4.207606973058637,
"grad_norm": 0.6958301147034044,
"learning_rate": 1.646997351962078e-05,
"loss": 0.3056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2943539023399353,
"step": 2655,
"valid_targets_mean": 3598.9,
"valid_targets_min": 1080
},
{
"epoch": 4.215530903328051,
"grad_norm": 0.8106867092367795,
"learning_rate": 1.639220830526072e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31939899921417236,
"step": 2660,
"valid_targets_mean": 2794.2,
"valid_targets_min": 826
},
{
"epoch": 4.223454833597464,
"grad_norm": 0.7722347258533244,
"learning_rate": 1.631449942954304e-05,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2992505133152008,
"step": 2665,
"valid_targets_mean": 3432.8,
"valid_targets_min": 791
},
{
"epoch": 4.231378763866878,
"grad_norm": 0.6605244498088375,
"learning_rate": 1.623684810595592e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26709267497062683,
"step": 2670,
"valid_targets_mean": 3478.2,
"valid_targets_min": 1440
},
{
"epoch": 4.239302694136292,
"grad_norm": 0.7294542403387982,
"learning_rate": 1.6159255547088806e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3037455081939697,
"step": 2675,
"valid_targets_mean": 3395.0,
"valid_targets_min": 908
},
{
"epoch": 4.247226624405705,
"grad_norm": 0.7747203263130421,
"learning_rate": 1.608172296461349e-05,
"loss": 0.3128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3067532777786255,
"step": 2680,
"valid_targets_mean": 3267.0,
"valid_targets_min": 1247
},
{
"epoch": 4.255150554675119,
"grad_norm": 0.7171739409331684,
"learning_rate": 1.6004251569265187e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30375757813453674,
"step": 2685,
"valid_targets_mean": 3726.8,
"valid_targets_min": 1447
},
{
"epoch": 4.263074484944532,
"grad_norm": 0.6834444351988356,
"learning_rate": 1.5926842570823624e-05,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29319584369659424,
"step": 2690,
"valid_targets_mean": 3729.8,
"valid_targets_min": 965
},
{
"epoch": 4.270998415213946,
"grad_norm": 0.8517435436774768,
"learning_rate": 1.5849497178094132e-05,
"loss": 0.3179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3134300410747528,
"step": 2695,
"valid_targets_mean": 2532.6,
"valid_targets_min": 987
},
{
"epoch": 4.27892234548336,
"grad_norm": 0.7775253010328972,
"learning_rate": 1.5772216598888802e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30423301458358765,
"step": 2700,
"valid_targets_mean": 2795.2,
"valid_targets_min": 742
},
{
"epoch": 4.286846275752773,
"grad_norm": 0.7218371372885936,
"learning_rate": 1.5695002040007613e-05,
"loss": 0.3147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3007104992866516,
"step": 2705,
"valid_targets_mean": 3370.9,
"valid_targets_min": 944
},
{
"epoch": 4.294770206022187,
"grad_norm": 0.743546396207078,
"learning_rate": 1.5617854707219574e-05,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31770211458206177,
"step": 2710,
"valid_targets_mean": 3224.2,
"valid_targets_min": 1224
},
{
"epoch": 4.302694136291601,
"grad_norm": 0.7458055587700105,
"learning_rate": 1.5540775805243896e-05,
"loss": 0.3072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2979353368282318,
"step": 2715,
"valid_targets_mean": 2920.5,
"valid_targets_min": 1073
},
{
"epoch": 4.310618066561014,
"grad_norm": 0.7824000519774981,
"learning_rate": 1.5463766537731202e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33337557315826416,
"step": 2720,
"valid_targets_mean": 3077.6,
"valid_targets_min": 1114
},
{
"epoch": 4.318541996830428,
"grad_norm": 0.7518246296874621,
"learning_rate": 1.5386828107244705e-05,
"loss": 0.3089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2896403670310974,
"step": 2725,
"valid_targets_mean": 3393.7,
"valid_targets_min": 1552
},
{
"epoch": 4.326465927099841,
"grad_norm": 0.648023364162129,
"learning_rate": 1.530996171524145e-05,
"loss": 0.2982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30871593952178955,
"step": 2730,
"valid_targets_mean": 4109.9,
"valid_targets_min": 1139
},
{
"epoch": 4.334389857369255,
"grad_norm": 0.769692357957425,
"learning_rate": 1.5233168562053517e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2859308123588562,
"step": 2735,
"valid_targets_mean": 2917.9,
"valid_targets_min": 1157
},
{
"epoch": 4.342313787638669,
"grad_norm": 0.7237354504090463,
"learning_rate": 1.515644984686933e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3038594424724579,
"step": 2740,
"valid_targets_mean": 3344.9,
"valid_targets_min": 820
},
{
"epoch": 4.350237717908082,
"grad_norm": 0.7945130184832356,
"learning_rate": 1.507980676771489e-05,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2981492877006531,
"step": 2745,
"valid_targets_mean": 2807.6,
"valid_targets_min": 906
},
{
"epoch": 4.358161648177496,
"grad_norm": 0.7902636448758641,
"learning_rate": 1.5003240521435076e-05,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31415724754333496,
"step": 2750,
"valid_targets_mean": 2672.6,
"valid_targets_min": 746
},
{
"epoch": 4.36608557844691,
"grad_norm": 0.8020499365789604,
"learning_rate": 1.4926752303674967e-05,
"loss": 0.3323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36749058961868286,
"step": 2755,
"valid_targets_mean": 2934.5,
"valid_targets_min": 1510
},
{
"epoch": 4.374009508716323,
"grad_norm": 0.6976026655059031,
"learning_rate": 1.4850343308861152e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2690892815589905,
"step": 2760,
"valid_targets_mean": 3675.6,
"valid_targets_min": 1576
},
{
"epoch": 4.381933438985737,
"grad_norm": 0.8273604681356571,
"learning_rate": 1.47740147301831e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30167335271835327,
"step": 2765,
"valid_targets_mean": 2629.6,
"valid_targets_min": 989
},
{
"epoch": 4.38985736925515,
"grad_norm": 0.6544057381783281,
"learning_rate": 1.4697767759574508e-05,
"loss": 0.289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2769451141357422,
"step": 2770,
"valid_targets_mean": 4037.2,
"valid_targets_min": 1005
},
{
"epoch": 4.397781299524564,
"grad_norm": 0.8243154638778755,
"learning_rate": 1.4621603587694688e-05,
"loss": 0.3059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.313541978597641,
"step": 2775,
"valid_targets_mean": 2701.2,
"valid_targets_min": 1603
},
{
"epoch": 4.405705229793978,
"grad_norm": 0.915560332977614,
"learning_rate": 1.454552340391e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3276725709438324,
"step": 2780,
"valid_targets_mean": 3331.5,
"valid_targets_min": 1087
},
{
"epoch": 4.413629160063391,
"grad_norm": 0.6485103596763808,
"learning_rate": 1.446952839627525e-05,
"loss": 0.3172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3232860565185547,
"step": 2785,
"valid_targets_mean": 4013.6,
"valid_targets_min": 1047
},
{
"epoch": 4.4215530903328055,
"grad_norm": 1.172378270754862,
"learning_rate": 1.4393619751515147e-05,
"loss": 0.3113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.308063268661499,
"step": 2790,
"valid_targets_mean": 2999.6,
"valid_targets_min": 1269
},
{
"epoch": 4.429477020602219,
"grad_norm": 0.768155820928126,
"learning_rate": 1.4317798655005777e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28411513566970825,
"step": 2795,
"valid_targets_mean": 3562.4,
"valid_targets_min": 323
},
{
"epoch": 4.437400950871632,
"grad_norm": 0.7875527455561598,
"learning_rate": 1.4242066290756084e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3191964328289032,
"step": 2800,
"valid_targets_mean": 3007.8,
"valid_targets_min": 1102
},
{
"epoch": 4.445324881141046,
"grad_norm": 0.7458242607802088,
"learning_rate": 1.4166423841389387e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2911447286605835,
"step": 2805,
"valid_targets_mean": 2887.9,
"valid_targets_min": 1028
},
{
"epoch": 4.453248811410459,
"grad_norm": 0.822647246509666,
"learning_rate": 1.4090872488124916e-05,
"loss": 0.3136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.307691752910614,
"step": 2810,
"valid_targets_mean": 2768.2,
"valid_targets_min": 536
},
{
"epoch": 4.461172741679873,
"grad_norm": 0.7771496896525412,
"learning_rate": 1.4015413410759343e-05,
"loss": 0.3249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3093550205230713,
"step": 2815,
"valid_targets_mean": 2895.3,
"valid_targets_min": 1313
},
{
"epoch": 4.469096671949287,
"grad_norm": 0.7655768531728774,
"learning_rate": 1.3940047787648388e-05,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3004239797592163,
"step": 2820,
"valid_targets_mean": 2810.7,
"valid_targets_min": 913
},
{
"epoch": 4.4770206022187,
"grad_norm": 0.936481404258253,
"learning_rate": 1.3864776795688408e-05,
"loss": 0.3309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3504589796066284,
"step": 2825,
"valid_targets_mean": 3516.6,
"valid_targets_min": 1193
},
{
"epoch": 4.4849445324881145,
"grad_norm": 0.816980590525859,
"learning_rate": 1.3789601610298013e-05,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.287618488073349,
"step": 2830,
"valid_targets_mean": 2968.8,
"valid_targets_min": 1097
},
{
"epoch": 4.492868462757528,
"grad_norm": 0.778268098745374,
"learning_rate": 1.3714523405399711e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3074689507484436,
"step": 2835,
"valid_targets_mean": 2911.4,
"valid_targets_min": 1061
},
{
"epoch": 4.500792393026941,
"grad_norm": 0.6573666416474037,
"learning_rate": 1.3639543353401588e-05,
"loss": 0.3278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2881685495376587,
"step": 2840,
"valid_targets_mean": 3663.2,
"valid_targets_min": 1408
},
{
"epoch": 4.508716323296355,
"grad_norm": 0.6941710441249608,
"learning_rate": 1.3564662625178979e-05,
"loss": 0.3059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33653414249420166,
"step": 2845,
"valid_targets_mean": 3397.4,
"valid_targets_min": 681
},
{
"epoch": 4.516640253565768,
"grad_norm": 0.7863043325335887,
"learning_rate": 1.3489882390056214e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29496651887893677,
"step": 2850,
"valid_targets_mean": 2781.9,
"valid_targets_min": 1277
},
{
"epoch": 4.524564183835182,
"grad_norm": 0.8634068488077267,
"learning_rate": 1.3415203815788317e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2938062250614166,
"step": 2855,
"valid_targets_mean": 3095.8,
"valid_targets_min": 954
},
{
"epoch": 4.532488114104596,
"grad_norm": 0.7939512722364277,
"learning_rate": 1.3340628068542816e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2892675995826721,
"step": 2860,
"valid_targets_mean": 2929.0,
"valid_targets_min": 698
},
{
"epoch": 4.540412044374009,
"grad_norm": 0.8239988059278375,
"learning_rate": 1.3266156312881497e-05,
"loss": 0.3041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29567891359329224,
"step": 2865,
"valid_targets_mean": 2818.6,
"valid_targets_min": 1250
},
{
"epoch": 4.5483359746434235,
"grad_norm": 0.8011210887144335,
"learning_rate": 1.3191789711742237e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2970122694969177,
"step": 2870,
"valid_targets_mean": 2888.4,
"valid_targets_min": 1206
},
{
"epoch": 4.556259904912837,
"grad_norm": 0.6220168440568122,
"learning_rate": 1.3117529426420838e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3001657724380493,
"step": 2875,
"valid_targets_mean": 4320.4,
"valid_targets_min": 1126
},
{
"epoch": 4.56418383518225,
"grad_norm": 0.7549078864914368,
"learning_rate": 1.3043376616552889e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27980339527130127,
"step": 2880,
"valid_targets_mean": 3092.2,
"valid_targets_min": 942
},
{
"epoch": 4.572107765451664,
"grad_norm": 0.7620019128280029,
"learning_rate": 1.296933244009567e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31075483560562134,
"step": 2885,
"valid_targets_mean": 3096.1,
"valid_targets_min": 1150
},
{
"epoch": 4.580031695721077,
"grad_norm": 0.7628895287961468,
"learning_rate": 1.2895398053310053e-05,
"loss": 0.2862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894461154937744,
"step": 2890,
"valid_targets_mean": 3295.6,
"valid_targets_min": 636
},
{
"epoch": 4.5879556259904914,
"grad_norm": 0.9803486983305757,
"learning_rate": 1.2821574610742453e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31783849000930786,
"step": 2895,
"valid_targets_mean": 2410.8,
"valid_targets_min": 845
},
{
"epoch": 4.595879556259905,
"grad_norm": 0.672927388574443,
"learning_rate": 1.2747863265206801e-05,
"loss": 0.3126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.308796763420105,
"step": 2900,
"valid_targets_mean": 3501.9,
"valid_targets_min": 868
},
{
"epoch": 4.603803486529318,
"grad_norm": 0.7279777785970651,
"learning_rate": 1.2674265167766545e-05,
"loss": 0.3101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28767889738082886,
"step": 2905,
"valid_targets_mean": 3142.7,
"valid_targets_min": 797
},
{
"epoch": 4.6117274167987325,
"grad_norm": 0.810766208206082,
"learning_rate": 1.2600781467716665e-05,
"loss": 0.3193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3437730073928833,
"step": 2910,
"valid_targets_mean": 2790.1,
"valid_targets_min": 1091
},
{
"epoch": 4.619651347068146,
"grad_norm": 0.806232766113042,
"learning_rate": 1.2527413312565737e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30441755056381226,
"step": 2915,
"valid_targets_mean": 2803.9,
"valid_targets_min": 1041
},
{
"epoch": 4.627575277337559,
"grad_norm": 0.771054199386212,
"learning_rate": 1.2454161848018003e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31878095865249634,
"step": 2920,
"valid_targets_mean": 3022.9,
"valid_targets_min": 1210
},
{
"epoch": 4.635499207606973,
"grad_norm": 0.7455086622171665,
"learning_rate": 1.2381028217955486e-05,
"loss": 0.3239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29189303517341614,
"step": 2925,
"valid_targets_mean": 3102.1,
"valid_targets_min": 832
},
{
"epoch": 4.643423137876387,
"grad_norm": 0.6813592554934786,
"learning_rate": 1.2308013564420132e-05,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672593295574188,
"step": 2930,
"valid_targets_mean": 3894.0,
"valid_targets_min": 1700
},
{
"epoch": 4.6513470681458005,
"grad_norm": 0.7204804043327222,
"learning_rate": 1.2235119027595957e-05,
"loss": 0.3069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32479286193847656,
"step": 2935,
"valid_targets_mean": 3971.2,
"valid_targets_min": 1352
},
{
"epoch": 4.659270998415214,
"grad_norm": 0.7638356280818674,
"learning_rate": 1.2162345745791268e-05,
"loss": 0.3033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31609421968460083,
"step": 2940,
"valid_targets_mean": 3019.4,
"valid_targets_min": 977
},
{
"epoch": 4.667194928684627,
"grad_norm": 0.7039388185448092,
"learning_rate": 1.2089694855420873e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.287856787443161,
"step": 2945,
"valid_targets_mean": 3415.1,
"valid_targets_min": 1312
},
{
"epoch": 4.675118858954042,
"grad_norm": 0.7151331805533307,
"learning_rate": 1.201716749098833e-05,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898104190826416,
"step": 2950,
"valid_targets_mean": 3416.0,
"valid_targets_min": 1124
},
{
"epoch": 4.683042789223455,
"grad_norm": 1.9704639419589094,
"learning_rate": 1.1944764785068248e-05,
"loss": 0.3303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3315780758857727,
"step": 2955,
"valid_targets_mean": 2883.4,
"valid_targets_min": 1348
},
{
"epoch": 4.690966719492868,
"grad_norm": 0.8156790243383886,
"learning_rate": 1.187248786828858e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3219088912010193,
"step": 2960,
"valid_targets_mean": 2594.6,
"valid_targets_min": 1422
},
{
"epoch": 4.698890649762282,
"grad_norm": 0.8039682183624894,
"learning_rate": 1.1800337869312988e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29908105731010437,
"step": 2965,
"valid_targets_mean": 2810.3,
"valid_targets_min": 1371
},
{
"epoch": 4.706814580031696,
"grad_norm": 0.8068691479781692,
"learning_rate": 1.17283159148232e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33075129985809326,
"step": 2970,
"valid_targets_mean": 2863.6,
"valid_targets_min": 1015
},
{
"epoch": 4.7147385103011095,
"grad_norm": 0.689486051910562,
"learning_rate": 1.165642312950142e-05,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2692754864692688,
"step": 2975,
"valid_targets_mean": 3604.5,
"valid_targets_min": 1605
},
{
"epoch": 4.722662440570523,
"grad_norm": 0.8268105603028824,
"learning_rate": 1.1584660636012788e-05,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33773764967918396,
"step": 2980,
"valid_targets_mean": 3095.1,
"valid_targets_min": 947
},
{
"epoch": 4.730586370839936,
"grad_norm": 0.6575919589133923,
"learning_rate": 1.1513029554987804e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2386166751384735,
"step": 2985,
"valid_targets_mean": 4465.2,
"valid_targets_min": 1680
},
{
"epoch": 4.738510301109351,
"grad_norm": 0.6371132125962272,
"learning_rate": 1.144153100500488e-05,
"loss": 0.3123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2862992286682129,
"step": 2990,
"valid_targets_mean": 3861.9,
"valid_targets_min": 1972
},
{
"epoch": 4.746434231378764,
"grad_norm": 0.7441439350640655,
"learning_rate": 1.1370166102572826e-05,
"loss": 0.3057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36143922805786133,
"step": 2995,
"valid_targets_mean": 3635.9,
"valid_targets_min": 1142
},
{
"epoch": 4.754358161648177,
"grad_norm": 0.6737445792645919,
"learning_rate": 1.1298935962113436e-05,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2750626802444458,
"step": 3000,
"valid_targets_mean": 3542.1,
"valid_targets_min": 1289
},
{
"epoch": 4.762282091917591,
"grad_norm": 0.7212930569332857,
"learning_rate": 1.1227841695944104e-05,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3105536699295044,
"step": 3005,
"valid_targets_mean": 3204.9,
"valid_targets_min": 1114
},
{
"epoch": 4.770206022187005,
"grad_norm": 0.6111875624664306,
"learning_rate": 1.1156884414260412e-05,
"loss": 0.3123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29388630390167236,
"step": 3010,
"valid_targets_mean": 3729.1,
"valid_targets_min": 1208
},
{
"epoch": 4.7781299524564185,
"grad_norm": 0.764650461989785,
"learning_rate": 1.1086065225118836e-05,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2933449447154999,
"step": 3015,
"valid_targets_mean": 3383.9,
"valid_targets_min": 984
},
{
"epoch": 4.786053882725832,
"grad_norm": 0.7224666416313265,
"learning_rate": 1.1015385234419402e-05,
"loss": 0.3033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29492539167404175,
"step": 3020,
"valid_targets_mean": 3344.1,
"valid_targets_min": 906
},
{
"epoch": 4.793977812995245,
"grad_norm": 0.7948708382462361,
"learning_rate": 1.0944845545888462e-05,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2928083539009094,
"step": 3025,
"valid_targets_mean": 2741.6,
"valid_targets_min": 1171
},
{
"epoch": 4.80190174326466,
"grad_norm": 0.7388242674514477,
"learning_rate": 1.0874447261061406e-05,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3079679608345032,
"step": 3030,
"valid_targets_mean": 3113.4,
"valid_targets_min": 1405
},
{
"epoch": 4.809825673534073,
"grad_norm": 0.702881645128125,
"learning_rate": 1.0804191479265525e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2963460087776184,
"step": 3035,
"valid_targets_mean": 3467.6,
"valid_targets_min": 1365
},
{
"epoch": 4.817749603803486,
"grad_norm": 0.893930060872408,
"learning_rate": 1.0734079297602772e-05,
"loss": 0.3342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3658490777015686,
"step": 3040,
"valid_targets_mean": 2750.2,
"valid_targets_min": 1131
},
{
"epoch": 4.8256735340729,
"grad_norm": 0.6855561554316635,
"learning_rate": 1.0664111810932671e-05,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28777241706848145,
"step": 3045,
"valid_targets_mean": 3720.5,
"valid_targets_min": 605
},
{
"epoch": 4.833597464342314,
"grad_norm": 0.7116370163557326,
"learning_rate": 1.0594290111855245e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32314878702163696,
"step": 3050,
"valid_targets_mean": 3834.8,
"valid_targets_min": 1553
},
{
"epoch": 4.8415213946117275,
"grad_norm": 0.8748328547962919,
"learning_rate": 1.0524615290693881e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3117261826992035,
"step": 3055,
"valid_targets_mean": 2272.6,
"valid_targets_min": 795
},
{
"epoch": 4.849445324881141,
"grad_norm": 0.7163896836836389,
"learning_rate": 1.0455088435478384e-05,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3054528832435608,
"step": 3060,
"valid_targets_mean": 3340.7,
"valid_targets_min": 685
},
{
"epoch": 4.857369255150554,
"grad_norm": 0.7990504060097595,
"learning_rate": 1.0385710631927917e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28801190853118896,
"step": 3065,
"valid_targets_mean": 2581.8,
"valid_targets_min": 852
},
{
"epoch": 4.865293185419969,
"grad_norm": 0.7858386332238347,
"learning_rate": 1.031648296343411e-05,
"loss": 0.3175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30044302344322205,
"step": 3070,
"valid_targets_mean": 3524.5,
"valid_targets_min": 699
},
{
"epoch": 4.873217115689382,
"grad_norm": 0.7573279065310472,
"learning_rate": 1.0247406511044079e-05,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34992167353630066,
"step": 3075,
"valid_targets_mean": 3097.5,
"valid_targets_min": 1330
},
{
"epoch": 4.881141045958795,
"grad_norm": 0.7999207340654183,
"learning_rate": 1.0178482353443588e-05,
"loss": 0.3078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32113009691238403,
"step": 3080,
"valid_targets_mean": 2807.9,
"valid_targets_min": 1241
},
{
"epoch": 4.889064976228209,
"grad_norm": 0.849335113475438,
"learning_rate": 1.010971156694021e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3222789168357849,
"step": 3085,
"valid_targets_mean": 2970.4,
"valid_targets_min": 1106
},
{
"epoch": 4.896988906497623,
"grad_norm": 0.6823190767279323,
"learning_rate": 1.004109522544647e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27712273597717285,
"step": 3090,
"valid_targets_mean": 3440.9,
"valid_targets_min": 1461
},
{
"epoch": 4.9049128367670365,
"grad_norm": 0.7200895601882453,
"learning_rate": 9.972634400463135e-06,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2947770953178406,
"step": 3095,
"valid_targets_mean": 3490.6,
"valid_targets_min": 980
},
{
"epoch": 4.91283676703645,
"grad_norm": 0.6645038831235541,
"learning_rate": 9.90433016106243e-06,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31558895111083984,
"step": 3100,
"valid_targets_mean": 3618.5,
"valid_targets_min": 1104
},
{
"epoch": 4.920760697305864,
"grad_norm": 0.8119936304510853,
"learning_rate": 9.836183573871394e-06,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2948872447013855,
"step": 3105,
"valid_targets_mean": 2676.7,
"valid_targets_min": 1118
},
{
"epoch": 4.928684627575278,
"grad_norm": 0.8117809416258112,
"learning_rate": 9.768195703055163e-06,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30462121963500977,
"step": 3110,
"valid_targets_mean": 2633.5,
"valid_targets_min": 1138
},
{
"epoch": 4.936608557844691,
"grad_norm": 0.7939054585691092,
"learning_rate": 9.700367610300423e-06,
"loss": 0.307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3095425069332123,
"step": 3115,
"valid_targets_mean": 2848.7,
"valid_targets_min": 1131
},
{
"epoch": 4.944532488114104,
"grad_norm": 0.7205066824623103,
"learning_rate": 9.632700354798766e-06,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2746793031692505,
"step": 3120,
"valid_targets_mean": 3183.8,
"valid_targets_min": 1716
},
{
"epoch": 4.952456418383518,
"grad_norm": 0.8435432284739308,
"learning_rate": 9.565194993230176e-06,
"loss": 0.3132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33743882179260254,
"step": 3125,
"valid_targets_mean": 2504.1,
"valid_targets_min": 933
},
{
"epoch": 4.960380348652932,
"grad_norm": 0.7878822964478979,
"learning_rate": 9.49785257974656e-06,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2942264676094055,
"step": 3130,
"valid_targets_mean": 2571.7,
"valid_targets_min": 1017
},
{
"epoch": 4.9683042789223455,
"grad_norm": 0.8361868331960012,
"learning_rate": 9.430674165955218e-06,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34500449895858765,
"step": 3135,
"valid_targets_mean": 3657.2,
"valid_targets_min": 1331
},
{
"epoch": 4.976228209191759,
"grad_norm": 0.6974763936046318,
"learning_rate": 9.363660800902498e-06,
"loss": 0.3157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.305804580450058,
"step": 3140,
"valid_targets_mean": 3425.0,
"valid_targets_min": 1135
},
{
"epoch": 4.984152139461173,
"grad_norm": 0.8185536692198196,
"learning_rate": 9.296813531057336e-06,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28771495819091797,
"step": 3145,
"valid_targets_mean": 2709.5,
"valid_targets_min": 1177
},
{
"epoch": 4.992076069730587,
"grad_norm": 0.78537077588257,
"learning_rate": 9.230133400294994e-06,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3354733884334564,
"step": 3150,
"valid_targets_mean": 2970.9,
"valid_targets_min": 1264
},
{
"epoch": 5.0,
"grad_norm": 0.7377919783129347,
"learning_rate": 9.163621449880686e-06,
"loss": 0.3065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2943228781223297,
"step": 3155,
"valid_targets_mean": 3264.5,
"valid_targets_min": 854
},
{
"epoch": 5.007923930269413,
"grad_norm": 0.6897294221365783,
"learning_rate": 9.097278718453366e-06,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24547956883907318,
"step": 3160,
"valid_targets_mean": 3132.8,
"valid_targets_min": 926
},
{
"epoch": 5.015847860538828,
"grad_norm": 0.7613434863732377,
"learning_rate": 9.0311062420095e-06,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28858259320259094,
"step": 3165,
"valid_targets_mean": 3152.6,
"valid_targets_min": 1006
},
{
"epoch": 5.023771790808241,
"grad_norm": 0.6810586489493294,
"learning_rate": 8.965105053886864e-06,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31911516189575195,
"step": 3170,
"valid_targets_mean": 4410.9,
"valid_targets_min": 1588
},
{
"epoch": 5.0316957210776545,
"grad_norm": 0.9023064359994762,
"learning_rate": 8.899276184748454e-06,
"loss": 0.2826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28767329454421997,
"step": 3175,
"valid_targets_mean": 2300.8,
"valid_targets_min": 824
},
{
"epoch": 5.039619651347068,
"grad_norm": 0.8159003566834867,
"learning_rate": 8.833620662566325e-06,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3218589127063751,
"step": 3180,
"valid_targets_mean": 3145.6,
"valid_targets_min": 1378
},
{
"epoch": 5.047543581616482,
"grad_norm": 0.805782943916796,
"learning_rate": 8.768139512605615e-06,
"loss": 0.2739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26077768206596375,
"step": 3185,
"valid_targets_mean": 3293.0,
"valid_targets_min": 434
},
{
"epoch": 5.055467511885896,
"grad_norm": 0.7270822754678393,
"learning_rate": 8.702833757408465e-06,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29586848616600037,
"step": 3190,
"valid_targets_mean": 3872.6,
"valid_targets_min": 1007
},
{
"epoch": 5.063391442155309,
"grad_norm": 0.8662314523284074,
"learning_rate": 8.637704416778106e-06,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25883880257606506,
"step": 3195,
"valid_targets_mean": 2555.5,
"valid_targets_min": 1255
},
{
"epoch": 5.071315372424722,
"grad_norm": 0.9893594514085089,
"learning_rate": 8.572752507762893e-06,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3071678876876831,
"step": 3200,
"valid_targets_mean": 2334.6,
"valid_targets_min": 1084
},
{
"epoch": 5.079239302694137,
"grad_norm": 0.7663852834514877,
"learning_rate": 8.50797904464044e-06,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2686847448348999,
"step": 3205,
"valid_targets_mean": 3020.4,
"valid_targets_min": 974
},
{
"epoch": 5.08716323296355,
"grad_norm": 0.8272623217334393,
"learning_rate": 8.443385038901801e-06,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3090386390686035,
"step": 3210,
"valid_targets_mean": 2945.6,
"valid_targets_min": 1179
},
{
"epoch": 5.0950871632329635,
"grad_norm": 0.8759245976491827,
"learning_rate": 8.378971499235627e-06,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3076953887939453,
"step": 3215,
"valid_targets_mean": 2491.4,
"valid_targets_min": 786
},
{
"epoch": 5.103011093502377,
"grad_norm": 0.8719723671628756,
"learning_rate": 8.31473943151247e-06,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2724665105342865,
"step": 3220,
"valid_targets_mean": 2282.7,
"valid_targets_min": 729
},
{
"epoch": 5.110935023771791,
"grad_norm": 0.7575608712200748,
"learning_rate": 8.250689838769021e-06,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27652713656425476,
"step": 3225,
"valid_targets_mean": 3152.2,
"valid_targets_min": 1374
},
{
"epoch": 5.118858954041205,
"grad_norm": 0.7631967106769532,
"learning_rate": 8.186823721192505e-06,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2842700481414795,
"step": 3230,
"valid_targets_mean": 3138.7,
"valid_targets_min": 1766
},
{
"epoch": 5.126782884310618,
"grad_norm": 0.8153756836832209,
"learning_rate": 8.123142076105004e-06,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2878100275993347,
"step": 3235,
"valid_targets_mean": 2801.4,
"valid_targets_min": 1411
},
{
"epoch": 5.134706814580031,
"grad_norm": 0.8957597318522768,
"learning_rate": 8.05964589794791e-06,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3458958864212036,
"step": 3240,
"valid_targets_mean": 2559.4,
"valid_targets_min": 820
},
{
"epoch": 5.142630744849446,
"grad_norm": 0.7318674323785702,
"learning_rate": 7.996336178266422e-06,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2750980854034424,
"step": 3245,
"valid_targets_mean": 3455.2,
"valid_targets_min": 1764
},
{
"epoch": 5.150554675118859,
"grad_norm": 0.9159040940127984,
"learning_rate": 7.933213905694003e-06,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3370858132839203,
"step": 3250,
"valid_targets_mean": 2564.6,
"valid_targets_min": 901
},
{
"epoch": 5.1584786053882725,
"grad_norm": 0.7310111896825241,
"learning_rate": 7.87028006593701e-06,
"loss": 0.2986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27499884366989136,
"step": 3255,
"valid_targets_mean": 3558.4,
"valid_targets_min": 878
},
{
"epoch": 5.166402535657686,
"grad_norm": 0.6998508825943974,
"learning_rate": 7.807535641759229e-06,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2822907567024231,
"step": 3260,
"valid_targets_mean": 3665.8,
"valid_targets_min": 1305
},
{
"epoch": 5.1743264659271,
"grad_norm": 0.8038693569296806,
"learning_rate": 7.744981612966603e-06,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2702692151069641,
"step": 3265,
"valid_targets_mean": 3427.2,
"valid_targets_min": 1193
},
{
"epoch": 5.182250396196514,
"grad_norm": 0.8132637134761368,
"learning_rate": 7.682618956391854e-06,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.297921359539032,
"step": 3270,
"valid_targets_mean": 3114.1,
"valid_targets_min": 933
},
{
"epoch": 5.190174326465927,
"grad_norm": 0.9332356904299489,
"learning_rate": 7.62044864587931e-06,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29001176357269287,
"step": 3275,
"valid_targets_mean": 2984.0,
"valid_targets_min": 1307
},
{
"epoch": 5.19809825673534,
"grad_norm": 0.8407249660339803,
"learning_rate": 7.558471652269628e-06,
"loss": 0.2794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29336339235305786,
"step": 3280,
"valid_targets_mean": 3170.8,
"valid_targets_min": 955
},
{
"epoch": 5.206022187004755,
"grad_norm": 0.7286788825357956,
"learning_rate": 7.496688943384665e-06,
"loss": 0.2782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2957107424736023,
"step": 3285,
"valid_targets_mean": 3965.6,
"valid_targets_min": 699
},
{
"epoch": 5.213946117274168,
"grad_norm": 0.843729926958082,
"learning_rate": 7.435101484012377e-06,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26785874366760254,
"step": 3290,
"valid_targets_mean": 2523.9,
"valid_targets_min": 1106
},
{
"epoch": 5.2218700475435815,
"grad_norm": 0.7543573233989669,
"learning_rate": 7.37371023589172e-06,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30548304319381714,
"step": 3295,
"valid_targets_mean": 3348.4,
"valid_targets_min": 1143
},
{
"epoch": 5.229793977812995,
"grad_norm": 0.8415736840199303,
"learning_rate": 7.312516157697671e-06,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32893145084381104,
"step": 3300,
"valid_targets_mean": 3006.1,
"valid_targets_min": 1188
},
{
"epoch": 5.237717908082409,
"grad_norm": 0.8688405311258023,
"learning_rate": 7.251520205026206e-06,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2774360775947571,
"step": 3305,
"valid_targets_mean": 2578.9,
"valid_targets_min": 917
},
{
"epoch": 5.245641838351823,
"grad_norm": 0.741755679162456,
"learning_rate": 7.190723330379441e-06,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26800817251205444,
"step": 3310,
"valid_targets_mean": 3866.8,
"valid_targets_min": 1128
},
{
"epoch": 5.253565768621236,
"grad_norm": 0.8672010632197062,
"learning_rate": 7.1301264831507034e-06,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30261340737342834,
"step": 3315,
"valid_targets_mean": 2493.1,
"valid_targets_min": 879
},
{
"epoch": 5.261489698890649,
"grad_norm": 0.7745233459137596,
"learning_rate": 7.0697306096097195e-06,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29366734623908997,
"step": 3320,
"valid_targets_mean": 3542.4,
"valid_targets_min": 1182
},
{
"epoch": 5.269413629160064,
"grad_norm": 0.7143335848995784,
"learning_rate": 7.0095366528878785e-06,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28641337156295776,
"step": 3325,
"valid_targets_mean": 3704.6,
"valid_targets_min": 1336
},
{
"epoch": 5.277337559429477,
"grad_norm": 0.8434525424449542,
"learning_rate": 6.949545552963432e-06,
"loss": 0.2839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28280267119407654,
"step": 3330,
"valid_targets_mean": 2677.4,
"valid_targets_min": 882
},
{
"epoch": 5.2852614896988905,
"grad_norm": 0.7211383167902913,
"learning_rate": 6.8897582466468935e-06,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23306918144226074,
"step": 3335,
"valid_targets_mean": 3320.4,
"valid_targets_min": 1214
},
{
"epoch": 5.293185419968304,
"grad_norm": 0.7978182833247313,
"learning_rate": 6.830175667566341e-06,
"loss": 0.2881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.315056711435318,
"step": 3340,
"valid_targets_mean": 2939.9,
"valid_targets_min": 1346
},
{
"epoch": 5.301109350237718,
"grad_norm": 0.7519981164582723,
"learning_rate": 6.770798746152889e-06,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27680274844169617,
"step": 3345,
"valid_targets_mean": 3183.6,
"valid_targets_min": 1318
},
{
"epoch": 5.309033280507132,
"grad_norm": 0.7260292170527266,
"learning_rate": 6.711628409626116e-06,
"loss": 0.3043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2554418444633484,
"step": 3350,
"valid_targets_mean": 3416.9,
"valid_targets_min": 936
},
{
"epoch": 5.316957210776545,
"grad_norm": 0.7180192291084321,
"learning_rate": 6.652665581979638e-06,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24962565302848816,
"step": 3355,
"valid_targets_mean": 3221.9,
"valid_targets_min": 1302
},
{
"epoch": 5.324881141045958,
"grad_norm": 0.8635374138802002,
"learning_rate": 6.593911183966619e-06,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3145523965358734,
"step": 3360,
"valid_targets_mean": 3000.2,
"valid_targets_min": 1210
},
{
"epoch": 5.332805071315373,
"grad_norm": 0.8699435358472265,
"learning_rate": 6.53536613308543e-06,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29066410660743713,
"step": 3365,
"valid_targets_mean": 2882.2,
"valid_targets_min": 1138
},
{
"epoch": 5.340729001584786,
"grad_norm": 0.7867640692640012,
"learning_rate": 6.477031343565332e-06,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29037970304489136,
"step": 3370,
"valid_targets_mean": 3145.4,
"valid_targets_min": 860
},
{
"epoch": 5.3486529318541995,
"grad_norm": 0.7507037278817914,
"learning_rate": 6.418907726352153e-06,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2885250449180603,
"step": 3375,
"valid_targets_mean": 3860.5,
"valid_targets_min": 1288
},
{
"epoch": 5.356576862123613,
"grad_norm": 0.7970118224353988,
"learning_rate": 6.36099618909412e-06,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26279422640800476,
"step": 3380,
"valid_targets_mean": 2864.9,
"valid_targets_min": 819
},
{
"epoch": 5.364500792393027,
"grad_norm": 0.7741426066555225,
"learning_rate": 6.303297636127627e-06,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27045324444770813,
"step": 3385,
"valid_targets_mean": 3207.2,
"valid_targets_min": 1124
},
{
"epoch": 5.372424722662441,
"grad_norm": 0.7127854092350832,
"learning_rate": 6.245812968463176e-06,
"loss": 0.2816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2626931369304657,
"step": 3390,
"valid_targets_mean": 3690.8,
"valid_targets_min": 1093
},
{
"epoch": 5.380348652931854,
"grad_norm": 0.7646869762243618,
"learning_rate": 6.188543083771237e-06,
"loss": 0.2981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27869051694869995,
"step": 3395,
"valid_targets_mean": 3124.8,
"valid_targets_min": 767
},
{
"epoch": 5.3882725832012675,
"grad_norm": 0.7964101106360405,
"learning_rate": 6.131488876368303e-06,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3000558018684387,
"step": 3400,
"valid_targets_mean": 2870.7,
"valid_targets_min": 694
},
{
"epoch": 5.396196513470682,
"grad_norm": 0.9014007365513332,
"learning_rate": 6.074651237202862e-06,
"loss": 0.2832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2718481123447418,
"step": 3405,
"valid_targets_mean": 2537.0,
"valid_targets_min": 1225
},
{
"epoch": 5.404120443740095,
"grad_norm": 0.8463931416869477,
"learning_rate": 6.018031053841515e-06,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30765998363494873,
"step": 3410,
"valid_targets_mean": 2869.0,
"valid_targets_min": 1410
},
{
"epoch": 5.4120443740095086,
"grad_norm": 0.776508481811668,
"learning_rate": 5.9616292104551266e-06,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28548675775527954,
"step": 3415,
"valid_targets_mean": 3247.4,
"valid_targets_min": 993
},
{
"epoch": 5.419968304278922,
"grad_norm": 0.8811837893257158,
"learning_rate": 5.905446587804977e-06,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3118222653865814,
"step": 3420,
"valid_targets_mean": 2474.4,
"valid_targets_min": 1138
},
{
"epoch": 5.427892234548336,
"grad_norm": 0.737052644355842,
"learning_rate": 5.849484063229065e-06,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26889342069625854,
"step": 3425,
"valid_targets_mean": 3359.2,
"valid_targets_min": 1296
},
{
"epoch": 5.43581616481775,
"grad_norm": 0.8075780098541901,
"learning_rate": 5.793742510628344e-06,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2839280366897583,
"step": 3430,
"valid_targets_mean": 2892.2,
"valid_targets_min": 1268
},
{
"epoch": 5.443740095087163,
"grad_norm": 0.7504122925838632,
"learning_rate": 5.738222800453139e-06,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3097327947616577,
"step": 3435,
"valid_targets_mean": 3614.0,
"valid_targets_min": 1553
},
{
"epoch": 5.4516640253565765,
"grad_norm": 0.7821341583753948,
"learning_rate": 5.682925799689498e-06,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30923694372177124,
"step": 3440,
"valid_targets_mean": 3298.6,
"valid_targets_min": 805
},
{
"epoch": 5.459587955625991,
"grad_norm": 0.842641770651966,
"learning_rate": 5.627852371845684e-06,
"loss": 0.2746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2851231098175049,
"step": 3445,
"valid_targets_mean": 2770.8,
"valid_targets_min": 1158
},
{
"epoch": 5.467511885895404,
"grad_norm": 0.6353722332193599,
"learning_rate": 5.573003376938697e-06,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29435908794403076,
"step": 3450,
"valid_targets_mean": 3954.3,
"valid_targets_min": 1330
},
{
"epoch": 5.475435816164818,
"grad_norm": 0.7328969023306966,
"learning_rate": 5.518379671480813e-06,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2865089178085327,
"step": 3455,
"valid_targets_mean": 3525.1,
"valid_targets_min": 823
},
{
"epoch": 5.483359746434231,
"grad_norm": 0.7860142473044672,
"learning_rate": 5.4639821084662455e-06,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29145336151123047,
"step": 3460,
"valid_targets_mean": 3054.6,
"valid_targets_min": 1382
},
{
"epoch": 5.491283676703645,
"grad_norm": 0.6910554226534089,
"learning_rate": 5.409811537357789e-06,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25137072801589966,
"step": 3465,
"valid_targets_mean": 3725.8,
"valid_targets_min": 1728
},
{
"epoch": 5.499207606973059,
"grad_norm": 0.8218007972441929,
"learning_rate": 5.355868804073594e-06,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28947368264198303,
"step": 3470,
"valid_targets_mean": 2976.0,
"valid_targets_min": 1010
},
{
"epoch": 5.507131537242472,
"grad_norm": 0.8486787865272499,
"learning_rate": 5.302154750973909e-06,
"loss": 0.2706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28270223736763,
"step": 3475,
"valid_targets_mean": 2702.1,
"valid_targets_min": 844
},
{
"epoch": 5.5150554675118855,
"grad_norm": 0.7386221051012911,
"learning_rate": 5.24867021684798e-06,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26117268204689026,
"step": 3480,
"valid_targets_mean": 2879.7,
"valid_targets_min": 1225
},
{
"epoch": 5.5229793977813,
"grad_norm": 0.8216354291445843,
"learning_rate": 5.195416036900906e-06,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26249247789382935,
"step": 3485,
"valid_targets_mean": 3457.2,
"valid_targets_min": 767
},
{
"epoch": 5.530903328050713,
"grad_norm": 1.2084085528993374,
"learning_rate": 5.142393042740617e-06,
"loss": 0.319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29814475774765015,
"step": 3490,
"valid_targets_mean": 3182.1,
"valid_targets_min": 305
},
{
"epoch": 5.538827258320127,
"grad_norm": 0.7634750141593889,
"learning_rate": 5.089602062364898e-06,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26985257863998413,
"step": 3495,
"valid_targets_mean": 2986.9,
"valid_targets_min": 1617
},
{
"epoch": 5.546751188589541,
"grad_norm": 0.6904822066759423,
"learning_rate": 5.037043920148434e-06,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2691362202167511,
"step": 3500,
"valid_targets_mean": 3526.2,
"valid_targets_min": 1080
},
{
"epoch": 5.554675118858954,
"grad_norm": 0.7735767982702189,
"learning_rate": 4.984719436829966e-06,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2815571129322052,
"step": 3505,
"valid_targets_mean": 2997.6,
"valid_targets_min": 1134
},
{
"epoch": 5.562599049128368,
"grad_norm": 0.8692993197122556,
"learning_rate": 4.932629429499436e-06,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33151981234550476,
"step": 3510,
"valid_targets_mean": 3003.9,
"valid_targets_min": 965
},
{
"epoch": 5.570522979397781,
"grad_norm": 0.7646591093883555,
"learning_rate": 4.880774711585276e-06,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31601202487945557,
"step": 3515,
"valid_targets_mean": 3189.0,
"valid_targets_min": 1157
},
{
"epoch": 5.5784469096671945,
"grad_norm": 0.8965877881561789,
"learning_rate": 4.829156092841663e-06,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32319316267967224,
"step": 3520,
"valid_targets_mean": 2551.0,
"valid_targets_min": 663
},
{
"epoch": 5.586370839936609,
"grad_norm": 0.8160633796116353,
"learning_rate": 4.777774379335885e-06,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3042828440666199,
"step": 3525,
"valid_targets_mean": 3296.0,
"valid_targets_min": 1741
},
{
"epoch": 5.594294770206022,
"grad_norm": 0.7884724935404464,
"learning_rate": 4.726630373435783e-06,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2717769145965576,
"step": 3530,
"valid_targets_mean": 2871.7,
"valid_targets_min": 1732
},
{
"epoch": 5.602218700475436,
"grad_norm": 0.7825057706764867,
"learning_rate": 4.675724873797171e-06,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26800742745399475,
"step": 3535,
"valid_targets_mean": 3067.4,
"valid_targets_min": 735
},
{
"epoch": 5.61014263074485,
"grad_norm": 0.9287978737031195,
"learning_rate": 4.625058675351415e-06,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33994632959365845,
"step": 3540,
"valid_targets_mean": 2602.8,
"valid_targets_min": 1256
},
{
"epoch": 5.618066561014263,
"grad_norm": 0.7094356128210746,
"learning_rate": 4.5746325692929735e-06,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2771075367927551,
"step": 3545,
"valid_targets_mean": 3757.5,
"valid_targets_min": 916
},
{
"epoch": 5.625990491283677,
"grad_norm": 0.6859542644396153,
"learning_rate": 4.524447343067089e-06,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2836745083332062,
"step": 3550,
"valid_targets_mean": 4243.0,
"valid_targets_min": 1365
},
{
"epoch": 5.63391442155309,
"grad_norm": 0.7767300135724696,
"learning_rate": 4.474503780357435e-06,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2820754647254944,
"step": 3555,
"valid_targets_mean": 2876.2,
"valid_targets_min": 742
},
{
"epoch": 5.6418383518225035,
"grad_norm": 0.7629257100358653,
"learning_rate": 4.424802661073946e-06,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27318716049194336,
"step": 3560,
"valid_targets_mean": 3280.9,
"valid_targets_min": 1270
},
{
"epoch": 5.649762282091918,
"grad_norm": 0.7934856602984349,
"learning_rate": 4.375344761340576e-06,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2571597099304199,
"step": 3565,
"valid_targets_mean": 2402.7,
"valid_targets_min": 853
},
{
"epoch": 5.657686212361331,
"grad_norm": 0.8440924879483904,
"learning_rate": 4.326130853483206e-06,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26417356729507446,
"step": 3570,
"valid_targets_mean": 2511.9,
"valid_targets_min": 1487
},
{
"epoch": 5.665610142630745,
"grad_norm": 0.7334809221953392,
"learning_rate": 4.277161706017605e-06,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28534117341041565,
"step": 3575,
"valid_targets_mean": 4596.6,
"valid_targets_min": 1402
},
{
"epoch": 5.673534072900159,
"grad_norm": 0.8738186406944687,
"learning_rate": 4.228438083637376e-06,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29095956683158875,
"step": 3580,
"valid_targets_mean": 3154.4,
"valid_targets_min": 996
},
{
"epoch": 5.681458003169572,
"grad_norm": 0.8033107801600781,
"learning_rate": 4.179960747202079e-06,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28336301445961,
"step": 3585,
"valid_targets_mean": 3012.1,
"valid_targets_min": 1565
},
{
"epoch": 5.689381933438986,
"grad_norm": 0.7721918898048784,
"learning_rate": 4.1317304537252804e-06,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.260518342256546,
"step": 3590,
"valid_targets_mean": 3144.4,
"valid_targets_min": 981
},
{
"epoch": 5.697305863708399,
"grad_norm": 0.694223463065273,
"learning_rate": 4.0837479563627955e-06,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2553626298904419,
"step": 3595,
"valid_targets_mean": 3345.8,
"valid_targets_min": 1444
},
{
"epoch": 5.705229793977813,
"grad_norm": 0.6331316194608342,
"learning_rate": 4.03601400440089e-06,
"loss": 0.2821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2481665164232254,
"step": 3600,
"valid_targets_mean": 3937.8,
"valid_targets_min": 944
},
{
"epoch": 5.713153724247227,
"grad_norm": 0.7590163702300113,
"learning_rate": 3.988529343244573e-06,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28363344073295593,
"step": 3605,
"valid_targets_mean": 3357.2,
"valid_targets_min": 1556
},
{
"epoch": 5.72107765451664,
"grad_norm": 0.7862970467968567,
"learning_rate": 3.941294714406001e-06,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26843172311782837,
"step": 3610,
"valid_targets_mean": 2685.3,
"valid_targets_min": 1441
},
{
"epoch": 5.729001584786054,
"grad_norm": 0.811895324185377,
"learning_rate": 3.8943108554928396e-06,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29337239265441895,
"step": 3615,
"valid_targets_mean": 2627.5,
"valid_targets_min": 767
},
{
"epoch": 5.736925515055468,
"grad_norm": 0.7818395934035374,
"learning_rate": 3.8475785001968045e-06,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30510663986206055,
"step": 3620,
"valid_targets_mean": 3426.6,
"valid_targets_min": 1372
},
{
"epoch": 5.744849445324881,
"grad_norm": 0.7237109014055133,
"learning_rate": 3.8010983782821464e-06,
"loss": 0.2659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25533539056777954,
"step": 3625,
"valid_targets_mean": 3133.6,
"valid_targets_min": 921
},
{
"epoch": 5.752773375594295,
"grad_norm": 0.723095303208419,
"learning_rate": 3.7548712155743096e-06,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2870684862136841,
"step": 3630,
"valid_targets_mean": 3996.8,
"valid_targets_min": 942
},
{
"epoch": 5.760697305863708,
"grad_norm": 0.8844100592127758,
"learning_rate": 3.708897733948551e-06,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29853054881095886,
"step": 3635,
"valid_targets_mean": 2297.3,
"valid_targets_min": 584
},
{
"epoch": 5.768621236133122,
"grad_norm": 0.7893659220405335,
"learning_rate": 3.6631786513187017e-06,
"loss": 0.2857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2839739918708801,
"step": 3640,
"valid_targets_mean": 3098.4,
"valid_targets_min": 1312
},
{
"epoch": 5.776545166402536,
"grad_norm": 0.7810985118615383,
"learning_rate": 3.617714681625939e-06,
"loss": 0.2857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2782176733016968,
"step": 3645,
"valid_targets_mean": 3081.3,
"valid_targets_min": 1199
},
{
"epoch": 5.784469096671949,
"grad_norm": 0.8015794756139869,
"learning_rate": 3.5725065348276332e-06,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28658199310302734,
"step": 3650,
"valid_targets_mean": 3216.1,
"valid_targets_min": 1163
},
{
"epoch": 5.792393026941363,
"grad_norm": 0.8065135711286809,
"learning_rate": 3.5275549168862843e-06,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3158048391342163,
"step": 3655,
"valid_targets_mean": 3061.4,
"valid_targets_min": 1504
},
{
"epoch": 5.800316957210777,
"grad_norm": 0.7907193883577602,
"learning_rate": 3.482860529758467e-06,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2796323895454407,
"step": 3660,
"valid_targets_mean": 2935.3,
"valid_targets_min": 1241
},
{
"epoch": 5.80824088748019,
"grad_norm": 0.8415609267338444,
"learning_rate": 3.4384240713839034e-06,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3068225383758545,
"step": 3665,
"valid_targets_mean": 3065.4,
"valid_targets_min": 1341
},
{
"epoch": 5.816164817749604,
"grad_norm": 1.0611550853060565,
"learning_rate": 3.3942462356745188e-06,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.285479873418808,
"step": 3670,
"valid_targets_mean": 3949.0,
"valid_targets_min": 1399
},
{
"epoch": 5.824088748019017,
"grad_norm": 0.8018422821150991,
"learning_rate": 3.350327712503665e-06,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29329565167427063,
"step": 3675,
"valid_targets_mean": 3313.6,
"valid_targets_min": 672
},
{
"epoch": 5.832012678288431,
"grad_norm": 0.8030610419531269,
"learning_rate": 3.306669187695286e-06,
"loss": 0.2761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25516191124916077,
"step": 3680,
"valid_targets_mean": 2793.8,
"valid_targets_min": 1390
},
{
"epoch": 5.839936608557845,
"grad_norm": 0.761756852048967,
"learning_rate": 3.2632713430132502e-06,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2513202130794525,
"step": 3685,
"valid_targets_mean": 3200.6,
"valid_targets_min": 1081
},
{
"epoch": 5.847860538827258,
"grad_norm": 1.1902444568785213,
"learning_rate": 3.220134856150692e-06,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2957605719566345,
"step": 3690,
"valid_targets_mean": 2885.6,
"valid_targets_min": 834
},
{
"epoch": 5.855784469096672,
"grad_norm": 0.7866773610863317,
"learning_rate": 3.177260400719422e-06,
"loss": 0.295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28008750081062317,
"step": 3695,
"valid_targets_mean": 4172.1,
"valid_targets_min": 1492
},
{
"epoch": 5.863708399366086,
"grad_norm": 0.8126826054651635,
"learning_rate": 3.134648646239422e-06,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2800007462501526,
"step": 3700,
"valid_targets_mean": 2865.2,
"valid_targets_min": 1157
},
{
"epoch": 5.871632329635499,
"grad_norm": 0.7014430955558992,
"learning_rate": 3.092300258128369e-06,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2964010238647461,
"step": 3705,
"valid_targets_mean": 3767.6,
"valid_targets_min": 778
},
{
"epoch": 5.879556259904913,
"grad_norm": 0.9601998578307006,
"learning_rate": 3.0502158976912733e-06,
"loss": 0.2839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2710258960723877,
"step": 3710,
"valid_targets_mean": 2326.4,
"valid_targets_min": 1060
},
{
"epoch": 5.887480190174326,
"grad_norm": 0.8008616041237828,
"learning_rate": 3.0083962221101193e-06,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27677208185195923,
"step": 3715,
"valid_targets_mean": 2879.9,
"valid_targets_min": 1298
},
{
"epoch": 5.89540412044374,
"grad_norm": 0.7720062924445003,
"learning_rate": 2.9668418844336356e-06,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26314905285835266,
"step": 3720,
"valid_targets_mean": 3117.0,
"valid_targets_min": 1529
},
{
"epoch": 5.903328050713154,
"grad_norm": 0.964559252585821,
"learning_rate": 2.9255535335670673e-06,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30997902154922485,
"step": 3725,
"valid_targets_mean": 2333.3,
"valid_targets_min": 973
},
{
"epoch": 5.911251980982567,
"grad_norm": 0.863580039309836,
"learning_rate": 2.8845318142620526e-06,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3259606957435608,
"step": 3730,
"valid_targets_mean": 2724.1,
"valid_targets_min": 719
},
{
"epoch": 5.919175911251981,
"grad_norm": 0.7223684462952389,
"learning_rate": 2.8437773671065796e-06,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2662881910800934,
"step": 3735,
"valid_targets_mean": 3433.8,
"valid_targets_min": 845
},
{
"epoch": 5.927099841521395,
"grad_norm": 0.8997397517104827,
"learning_rate": 2.803290828514935e-06,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2858402729034424,
"step": 3740,
"valid_targets_mean": 2252.3,
"valid_targets_min": 795
},
{
"epoch": 5.935023771790808,
"grad_norm": 1.257589056146217,
"learning_rate": 2.7630728307178166e-06,
"loss": 0.2945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3157416582107544,
"step": 3745,
"valid_targets_mean": 3201.3,
"valid_targets_min": 1047
},
{
"epoch": 5.942947702060222,
"grad_norm": 1.004305514240146,
"learning_rate": 2.723124001752415e-06,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.294961541891098,
"step": 3750,
"valid_targets_mean": 1967.2,
"valid_targets_min": 842
},
{
"epoch": 5.950871632329635,
"grad_norm": 0.9606671850132081,
"learning_rate": 2.6834449654526463e-06,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34209227561950684,
"step": 3755,
"valid_targets_mean": 2170.5,
"valid_targets_min": 720
},
{
"epoch": 5.958795562599049,
"grad_norm": 0.7957342434386907,
"learning_rate": 2.6440363414393776e-06,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2978052496910095,
"step": 3760,
"valid_targets_mean": 2861.3,
"valid_targets_min": 1318
},
{
"epoch": 5.966719492868463,
"grad_norm": 0.906718243376995,
"learning_rate": 2.6048987451107667e-06,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34471917152404785,
"step": 3765,
"valid_targets_mean": 2459.7,
"valid_targets_min": 919
},
{
"epoch": 5.974643423137876,
"grad_norm": 0.9374249518211754,
"learning_rate": 2.5660327876326596e-06,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31891578435897827,
"step": 3770,
"valid_targets_mean": 2455.0,
"valid_targets_min": 949
},
{
"epoch": 5.9825673534072905,
"grad_norm": 0.7160565242876318,
"learning_rate": 2.527439075929028e-06,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.250852108001709,
"step": 3775,
"valid_targets_mean": 3327.8,
"valid_targets_min": 1186
},
{
"epoch": 5.990491283676704,
"grad_norm": 0.8255785273755935,
"learning_rate": 2.489118212672512e-06,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3088967204093933,
"step": 3780,
"valid_targets_mean": 2943.2,
"valid_targets_min": 800
},
{
"epoch": 5.998415213946117,
"grad_norm": 0.6942790595633246,
"learning_rate": 2.4510707962749813e-06,
"loss": 0.2731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31014499068260193,
"step": 3785,
"valid_targets_mean": 4262.9,
"valid_targets_min": 1053
},
{
"epoch": 6.006339144215531,
"grad_norm": 0.8405826416690129,
"learning_rate": 2.413297420878231e-06,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2536356449127197,
"step": 3790,
"valid_targets_mean": 2973.3,
"valid_targets_min": 819
},
{
"epoch": 6.014263074484944,
"grad_norm": 0.9255627668051156,
"learning_rate": 2.375798676344652e-06,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3057909607887268,
"step": 3795,
"valid_targets_mean": 2337.0,
"valid_targets_min": 824
},
{
"epoch": 6.022187004754358,
"grad_norm": 0.7408039931277529,
"learning_rate": 2.338575148248077e-06,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2888672649860382,
"step": 3800,
"valid_targets_mean": 3384.5,
"valid_targets_min": 996
},
{
"epoch": 6.030110935023772,
"grad_norm": 0.744846896666886,
"learning_rate": 2.3016274178645826e-06,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2156473994255066,
"step": 3805,
"valid_targets_mean": 3281.6,
"valid_targets_min": 1175
},
{
"epoch": 6.038034865293185,
"grad_norm": 1.0372675808168368,
"learning_rate": 2.264956062163448e-06,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28580576181411743,
"step": 3810,
"valid_targets_mean": 3315.4,
"valid_targets_min": 1034
},
{
"epoch": 6.045958795562599,
"grad_norm": 0.7812177830894746,
"learning_rate": 2.2285616537981382e-06,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31875208020210266,
"step": 3815,
"valid_targets_mean": 3482.0,
"valid_targets_min": 825
},
{
"epoch": 6.053882725832013,
"grad_norm": 0.9237011609509943,
"learning_rate": 2.192444761097341e-06,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29322725534439087,
"step": 3820,
"valid_targets_mean": 2307.0,
"valid_targets_min": 842
},
{
"epoch": 6.061806656101426,
"grad_norm": 0.8990191236648827,
"learning_rate": 2.1566059480561276e-06,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2766517698764801,
"step": 3825,
"valid_targets_mean": 2363.1,
"valid_targets_min": 941
},
{
"epoch": 6.06973058637084,
"grad_norm": 0.7361355418620003,
"learning_rate": 2.1210457743271173e-06,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930822968482971,
"step": 3830,
"valid_targets_mean": 3734.8,
"valid_targets_min": 1547
},
{
"epoch": 6.077654516640253,
"grad_norm": 0.9139892229625006,
"learning_rate": 2.085764795211742e-06,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2555992603302002,
"step": 3835,
"valid_targets_mean": 3034.4,
"valid_targets_min": 1277
},
{
"epoch": 6.085578446909667,
"grad_norm": 0.771123933373858,
"learning_rate": 2.0507635616515896e-06,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2631310224533081,
"step": 3840,
"valid_targets_mean": 2985.9,
"valid_targets_min": 1237
},
{
"epoch": 6.093502377179081,
"grad_norm": 0.7897490876583761,
"learning_rate": 2.0160426202197782e-06,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2618263363838196,
"step": 3845,
"valid_targets_mean": 3156.4,
"valid_targets_min": 1103
},
{
"epoch": 6.101426307448494,
"grad_norm": 0.7722775214717016,
"learning_rate": 1.981602513112446e-06,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24826066195964813,
"step": 3850,
"valid_targets_mean": 3438.9,
"valid_targets_min": 889
},
{
"epoch": 6.1093502377179085,
"grad_norm": 0.7058163459626046,
"learning_rate": 1.947443778140259e-06,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3340873420238495,
"step": 3855,
"valid_targets_mean": 4009.1,
"valid_targets_min": 613
},
{
"epoch": 6.117274167987322,
"grad_norm": 0.8569365221631509,
"learning_rate": 1.9135669487200404e-06,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29067397117614746,
"step": 3860,
"valid_targets_mean": 3074.8,
"valid_targets_min": 804
},
{
"epoch": 6.125198098256735,
"grad_norm": 0.7812766506289543,
"learning_rate": 1.8799725538664138e-06,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24928317964076996,
"step": 3865,
"valid_targets_mean": 3012.5,
"valid_targets_min": 756
},
{
"epoch": 6.133122028526149,
"grad_norm": 0.8199444138458281,
"learning_rate": 1.8466611181835504e-06,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26236987113952637,
"step": 3870,
"valid_targets_mean": 2752.6,
"valid_targets_min": 1398
},
{
"epoch": 6.141045958795562,
"grad_norm": 0.7536336080898335,
"learning_rate": 1.813633161856998e-06,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2606717348098755,
"step": 3875,
"valid_targets_mean": 3515.2,
"valid_targets_min": 1170
},
{
"epoch": 6.148969889064976,
"grad_norm": 1.296674137353546,
"learning_rate": 1.7808892006455236e-06,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25334101915359497,
"step": 3880,
"valid_targets_mean": 3008.9,
"valid_targets_min": 959
},
{
"epoch": 6.15689381933439,
"grad_norm": 0.8549376573866226,
"learning_rate": 1.7484297458730903e-06,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27031368017196655,
"step": 3885,
"valid_targets_mean": 2541.9,
"valid_targets_min": 1088
},
{
"epoch": 6.164817749603803,
"grad_norm": 0.8660477974763549,
"learning_rate": 1.7162553044208397e-06,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27956318855285645,
"step": 3890,
"valid_targets_mean": 2584.7,
"valid_targets_min": 836
},
{
"epoch": 6.1727416798732175,
"grad_norm": 0.711909383806564,
"learning_rate": 1.6843663787192198e-06,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25135537981987,
"step": 3895,
"valid_targets_mean": 3468.3,
"valid_targets_min": 1001
},
{
"epoch": 6.180665610142631,
"grad_norm": 0.7256194141801523,
"learning_rate": 1.6527634667400905e-06,
"loss": 0.2794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2889530658721924,
"step": 3900,
"valid_targets_mean": 3539.7,
"valid_targets_min": 747
},
{
"epoch": 6.188589540412044,
"grad_norm": 0.89965843002777,
"learning_rate": 1.621447061988992e-06,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28266841173171997,
"step": 3905,
"valid_targets_mean": 2481.8,
"valid_targets_min": 1242
},
{
"epoch": 6.196513470681458,
"grad_norm": 0.6424467869924108,
"learning_rate": 1.5904176534974026e-06,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2667967677116394,
"step": 3910,
"valid_targets_mean": 4722.1,
"valid_targets_min": 1482
},
{
"epoch": 6.204437400950872,
"grad_norm": 0.7166598681182121,
"learning_rate": 1.559675725815124e-06,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644422650337219,
"step": 3915,
"valid_targets_mean": 3448.1,
"valid_targets_min": 1400
},
{
"epoch": 6.212361331220285,
"grad_norm": 0.6883227021978096,
"learning_rate": 1.5292217590027126e-06,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2776218056678772,
"step": 3920,
"valid_targets_mean": 3848.3,
"valid_targets_min": 1314
},
{
"epoch": 6.220285261489699,
"grad_norm": 0.8216293331586425,
"learning_rate": 1.4990562286239651e-06,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27567949891090393,
"step": 3925,
"valid_targets_mean": 2947.2,
"valid_targets_min": 1357
},
{
"epoch": 6.228209191759112,
"grad_norm": 0.8066020986178258,
"learning_rate": 1.4691796057385222e-06,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32604455947875977,
"step": 3930,
"valid_targets_mean": 3126.6,
"valid_targets_min": 1571
},
{
"epoch": 6.2361331220285265,
"grad_norm": 0.7786528543223891,
"learning_rate": 1.4395923568944792e-06,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2671036422252655,
"step": 3935,
"valid_targets_mean": 3246.4,
"valid_targets_min": 720
},
{
"epoch": 6.24405705229794,
"grad_norm": 0.720991179266921,
"learning_rate": 1.4102949441211333e-06,
"loss": 0.2628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2621596157550812,
"step": 3940,
"valid_targets_mean": 3775.2,
"valid_targets_min": 1717
},
{
"epoch": 6.251980982567353,
"grad_norm": 0.8635951163563789,
"learning_rate": 1.3812878249217375e-06,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2590984106063843,
"step": 3945,
"valid_targets_mean": 2491.5,
"valid_targets_min": 830
},
{
"epoch": 6.259904912836767,
"grad_norm": 0.8055705967233836,
"learning_rate": 1.3525714522663802e-06,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2969766855239868,
"step": 3950,
"valid_targets_mean": 3152.1,
"valid_targets_min": 1546
},
{
"epoch": 6.267828843106181,
"grad_norm": 0.8212779657990703,
"learning_rate": 1.3241462745849032e-06,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2703918516635895,
"step": 3955,
"valid_targets_mean": 2716.7,
"valid_targets_min": 1124
},
{
"epoch": 6.2757527733755945,
"grad_norm": 0.7792393371884195,
"learning_rate": 1.2960127357598907e-06,
"loss": 0.2741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29034721851348877,
"step": 3960,
"valid_targets_mean": 3387.6,
"valid_targets_min": 1440
},
{
"epoch": 6.283676703645008,
"grad_norm": 0.7746891412107202,
"learning_rate": 1.2681712751197561e-06,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27121007442474365,
"step": 3965,
"valid_targets_mean": 3463.2,
"valid_targets_min": 1184
},
{
"epoch": 6.291600633914421,
"grad_norm": 0.7782249097983254,
"learning_rate": 1.2406223274318619e-06,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2974588871002197,
"step": 3970,
"valid_targets_mean": 3313.4,
"valid_targets_min": 1128
},
{
"epoch": 6.2995245641838356,
"grad_norm": 0.7412856374389678,
"learning_rate": 1.2133663228957483e-06,
"loss": 0.2672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2881653606891632,
"step": 3975,
"valid_targets_mean": 3866.8,
"valid_targets_min": 1073
},
{
"epoch": 6.307448494453249,
"grad_norm": 0.8312977029113554,
"learning_rate": 1.186403687136397e-06,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27708035707473755,
"step": 3980,
"valid_targets_mean": 3342.8,
"valid_targets_min": 933
},
{
"epoch": 6.315372424722662,
"grad_norm": 0.8197541649986204,
"learning_rate": 1.1597348411976038e-06,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2698556184768677,
"step": 3985,
"valid_targets_mean": 3237.8,
"valid_targets_min": 951
},
{
"epoch": 6.323296354992076,
"grad_norm": 0.8471159114422045,
"learning_rate": 1.1333602015353896e-06,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26829445362091064,
"step": 3990,
"valid_targets_mean": 3004.6,
"valid_targets_min": 928
},
{
"epoch": 6.33122028526149,
"grad_norm": 0.7503125828764259,
"learning_rate": 1.1072801800114985e-06,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2777388393878937,
"step": 3995,
"valid_targets_mean": 3267.4,
"valid_targets_min": 947
},
{
"epoch": 6.3391442155309035,
"grad_norm": 0.8175380063542717,
"learning_rate": 1.0814951838869758e-06,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3123356103897095,
"step": 4000,
"valid_targets_mean": 2992.7,
"valid_targets_min": 950
},
{
"epoch": 6.347068145800317,
"grad_norm": 0.6162025832470477,
"learning_rate": 1.0560056158157938e-06,
"loss": 0.258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2392377257347107,
"step": 4005,
"valid_targets_mean": 4391.2,
"valid_targets_min": 1106
},
{
"epoch": 6.35499207606973,
"grad_norm": 0.7072834519407339,
"learning_rate": 1.0308118738385865e-06,
"loss": 0.2742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2674199938774109,
"step": 4010,
"valid_targets_mean": 4024.9,
"valid_targets_min": 832
},
{
"epoch": 6.362916006339145,
"grad_norm": 0.7287197281341509,
"learning_rate": 1.0059143513764003e-06,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2720893621444702,
"step": 4015,
"valid_targets_mean": 3626.2,
"valid_targets_min": 1144
},
{
"epoch": 6.370839936608558,
"grad_norm": 0.7782133569731706,
"learning_rate": 9.81313437224587e-07,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2739805579185486,
"step": 4020,
"valid_targets_mean": 3153.7,
"valid_targets_min": 1323
},
{
"epoch": 6.378763866877971,
"grad_norm": 1.0460021255922092,
"learning_rate": 9.57009515546703e-07,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28859415650367737,
"step": 4025,
"valid_targets_mean": 3569.7,
"valid_targets_min": 724
},
{
"epoch": 6.386687797147385,
"grad_norm": 0.7562261910777165,
"learning_rate": 9.330029658685302e-07,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27344030141830444,
"step": 4030,
"valid_targets_mean": 3449.7,
"valid_targets_min": 1592
},
{
"epoch": 6.394611727416799,
"grad_norm": 0.8544761844509305,
"learning_rate": 9.092941630721363e-07,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29668188095092773,
"step": 4035,
"valid_targets_mean": 2992.6,
"valid_targets_min": 1013
},
{
"epoch": 6.4025356576862125,
"grad_norm": 0.6668053311414428,
"learning_rate": 8.85883477390026e-07,
"loss": 0.2447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24657505750656128,
"step": 4040,
"valid_targets_mean": 3835.4,
"valid_targets_min": 1336
},
{
"epoch": 6.410459587955626,
"grad_norm": 0.7216857447286184,
"learning_rate": 8.627712743993655e-07,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2436390221118927,
"step": 4045,
"valid_targets_mean": 3372.4,
"valid_targets_min": 1404
},
{
"epoch": 6.418383518225039,
"grad_norm": 1.0127403923030123,
"learning_rate": 8.399579150162585e-07,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2674424648284912,
"step": 4050,
"valid_targets_mean": 3369.4,
"valid_targets_min": 1352
},
{
"epoch": 6.426307448494454,
"grad_norm": 0.8241874728542988,
"learning_rate": 8.174437554901304e-07,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.262814462184906,
"step": 4055,
"valid_targets_mean": 3054.7,
"valid_targets_min": 967
},
{
"epoch": 6.434231378763867,
"grad_norm": 0.7415633298787859,
"learning_rate": 7.9522914739814e-07,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257989764213562,
"step": 4060,
"valid_targets_mean": 3583.1,
"valid_targets_min": 1582
},
{
"epoch": 6.44215530903328,
"grad_norm": 0.7949440857800341,
"learning_rate": 7.733144376397184e-07,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28058376908302307,
"step": 4065,
"valid_targets_mean": 2917.6,
"valid_targets_min": 969
},
{
"epoch": 6.450079239302694,
"grad_norm": 0.7943902641247984,
"learning_rate": 7.516999684311277e-07,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26108643412590027,
"step": 4070,
"valid_targets_mean": 3074.9,
"valid_targets_min": 904
},
{
"epoch": 6.458003169572108,
"grad_norm": 0.8282850201666918,
"learning_rate": 7.303860773001248e-07,
"loss": 0.2703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2973766624927521,
"step": 4075,
"valid_targets_mean": 3289.0,
"valid_targets_min": 1388
},
{
"epoch": 6.4659270998415215,
"grad_norm": 0.8612035667904403,
"learning_rate": 7.093730970807034e-07,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2724660336971283,
"step": 4080,
"valid_targets_mean": 2506.1,
"valid_targets_min": 1134
},
{
"epoch": 6.473851030110935,
"grad_norm": 0.7705878492600347,
"learning_rate": 6.88661355907867e-07,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2626793384552002,
"step": 4085,
"valid_targets_mean": 3173.4,
"valid_targets_min": 1241
},
{
"epoch": 6.481774960380348,
"grad_norm": 0.8293774983470878,
"learning_rate": 6.682511772125422e-07,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2623213529586792,
"step": 4090,
"valid_targets_mean": 2695.9,
"valid_targets_min": 1083
},
{
"epoch": 6.489698890649763,
"grad_norm": 0.7185734573332064,
"learning_rate": 6.481428797164957e-07,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2767176628112793,
"step": 4095,
"valid_targets_mean": 3695.9,
"valid_targets_min": 1610
},
{
"epoch": 6.497622820919176,
"grad_norm": 0.7192376832208326,
"learning_rate": 6.283367774273785e-07,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2640265226364136,
"step": 4100,
"valid_targets_mean": 3505.2,
"valid_targets_min": 749
},
{
"epoch": 6.505546751188589,
"grad_norm": 0.7821908648146034,
"learning_rate": 6.088331796338032e-07,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2534036934375763,
"step": 4105,
"valid_targets_mean": 3527.4,
"valid_targets_min": 1362
},
{
"epoch": 6.513470681458003,
"grad_norm": 0.8284059543758624,
"learning_rate": 5.896323909005408e-07,
"loss": 0.2658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2960991859436035,
"step": 4110,
"valid_targets_mean": 2956.4,
"valid_targets_min": 1221
},
{
"epoch": 6.521394611727417,
"grad_norm": 0.7318982088006352,
"learning_rate": 5.707347110637363e-07,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2784423530101776,
"step": 4115,
"valid_targets_mean": 3589.7,
"valid_targets_min": 1266
},
{
"epoch": 6.5293185419968305,
"grad_norm": 0.8037460574946733,
"learning_rate": 5.521404352262427e-07,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2540718913078308,
"step": 4120,
"valid_targets_mean": 3112.4,
"valid_targets_min": 809
},
{
"epoch": 6.537242472266244,
"grad_norm": 0.8562375564350958,
"learning_rate": 5.338498537530146e-07,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2838800549507141,
"step": 4125,
"valid_targets_mean": 2713.3,
"valid_targets_min": 613
},
{
"epoch": 6.545166402535658,
"grad_norm": 0.8404101038916709,
"learning_rate": 5.158632522665619e-07,
"loss": 0.306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27864933013916016,
"step": 4130,
"valid_targets_mean": 2579.3,
"valid_targets_min": 1006
},
{
"epoch": 6.553090332805072,
"grad_norm": 0.8903943414798002,
"learning_rate": 4.981809116424985e-07,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.276671826839447,
"step": 4135,
"valid_targets_mean": 2540.3,
"valid_targets_min": 735
},
{
"epoch": 6.561014263074485,
"grad_norm": 0.7783873275285311,
"learning_rate": 4.808031080051545e-07,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29601848125457764,
"step": 4140,
"valid_targets_mean": 3532.1,
"valid_targets_min": 987
},
{
"epoch": 6.568938193343898,
"grad_norm": 0.8487222802895167,
"learning_rate": 4.637301127232663e-07,
"loss": 0.2693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2824670672416687,
"step": 4145,
"valid_targets_mean": 2751.2,
"valid_targets_min": 1035
},
{
"epoch": 6.576862123613312,
"grad_norm": 0.7810288925443892,
"learning_rate": 4.4696219240573327e-07,
"loss": 0.2796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29629069566726685,
"step": 4150,
"valid_targets_mean": 3234.6,
"valid_targets_min": 1025
},
{
"epoch": 6.584786053882726,
"grad_norm": 0.6639163886957854,
"learning_rate": 4.3049960889745666e-07,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2679304778575897,
"step": 4155,
"valid_targets_mean": 4046.2,
"valid_targets_min": 2034
},
{
"epoch": 6.5927099841521395,
"grad_norm": 0.766246752720584,
"learning_rate": 4.143426192752542e-07,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2746524214744568,
"step": 4160,
"valid_targets_mean": 3666.3,
"valid_targets_min": 1545
},
{
"epoch": 6.600633914421553,
"grad_norm": 0.8536786529200687,
"learning_rate": 3.984914758438407e-07,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3148544728755951,
"step": 4165,
"valid_targets_mean": 3556.8,
"valid_targets_min": 502
},
{
"epoch": 6.608557844690967,
"grad_norm": 0.8388466221341304,
"learning_rate": 3.8294642613189603e-07,
"loss": 0.2902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2988848388195038,
"step": 4170,
"valid_targets_mean": 3141.4,
"valid_targets_min": 1034
},
{
"epoch": 6.616481774960381,
"grad_norm": 0.8546205962148445,
"learning_rate": 3.6770771288818563e-07,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2964688539505005,
"step": 4175,
"valid_targets_mean": 2680.8,
"valid_targets_min": 1146
},
{
"epoch": 6.624405705229794,
"grad_norm": 0.6352285540163427,
"learning_rate": 3.5277557407778605e-07,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26553648710250854,
"step": 4180,
"valid_targets_mean": 4059.6,
"valid_targets_min": 1237
},
{
"epoch": 6.632329635499207,
"grad_norm": 0.9620640961546393,
"learning_rate": 3.3815024287835895e-07,
"loss": 0.2931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3085815906524658,
"step": 4185,
"valid_targets_mean": 2293.6,
"valid_targets_min": 768
},
{
"epoch": 6.640253565768621,
"grad_norm": 0.7540474372071029,
"learning_rate": 3.2383194767650947e-07,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257649302482605,
"step": 4190,
"valid_targets_mean": 3436.9,
"valid_targets_min": 1402
},
{
"epoch": 6.648177496038035,
"grad_norm": 0.8249666226190281,
"learning_rate": 3.098209120642248e-07,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894267737865448,
"step": 4195,
"valid_targets_mean": 3102.8,
"valid_targets_min": 1485
},
{
"epoch": 6.6561014263074485,
"grad_norm": 0.7985618899920006,
"learning_rate": 2.9611735483537684e-07,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29402169585227966,
"step": 4200,
"valid_targets_mean": 3086.1,
"valid_targets_min": 923
},
{
"epoch": 6.664025356576862,
"grad_norm": 0.7971335823491561,
"learning_rate": 2.827214899823183e-07,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28697848320007324,
"step": 4205,
"valid_targets_mean": 3342.2,
"valid_targets_min": 1271
},
{
"epoch": 6.671949286846276,
"grad_norm": 0.9626143965275245,
"learning_rate": 2.6963352669252095e-07,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29628515243530273,
"step": 4210,
"valid_targets_mean": 2125.6,
"valid_targets_min": 698
},
{
"epoch": 6.67987321711569,
"grad_norm": 0.7980141278149887,
"learning_rate": 2.568536693453272e-07,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2726362943649292,
"step": 4215,
"valid_targets_mean": 2887.1,
"valid_targets_min": 1048
},
{
"epoch": 6.687797147385103,
"grad_norm": 0.8055430110182665,
"learning_rate": 2.443821175087435e-07,
"loss": 0.2713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2402665913105011,
"step": 4220,
"valid_targets_mean": 2865.8,
"valid_targets_min": 1197
},
{
"epoch": 6.695721077654516,
"grad_norm": 0.8616251532210281,
"learning_rate": 2.3221906593634102e-07,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2799178957939148,
"step": 4225,
"valid_targets_mean": 3122.3,
"valid_targets_min": 1305
},
{
"epoch": 6.70364500792393,
"grad_norm": 0.774098085179844,
"learning_rate": 2.2036470456419767e-07,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32133832573890686,
"step": 4230,
"valid_targets_mean": 3208.2,
"valid_targets_min": 1505
},
{
"epoch": 6.711568938193344,
"grad_norm": 0.7956195714820337,
"learning_rate": 2.088192185079385e-07,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26833003759384155,
"step": 4235,
"valid_targets_mean": 2955.7,
"valid_targets_min": 1027
},
{
"epoch": 6.7194928684627575,
"grad_norm": 0.8577430299273257,
"learning_rate": 1.9758278805985574e-07,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32463526725769043,
"step": 4240,
"valid_targets_mean": 2802.4,
"valid_targets_min": 1128
},
{
"epoch": 6.727416798732171,
"grad_norm": 0.6783344453017468,
"learning_rate": 1.8665558868607325e-07,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2513703405857086,
"step": 4245,
"valid_targets_mean": 3795.2,
"valid_targets_min": 1668
},
{
"epoch": 6.735340729001585,
"grad_norm": 0.6750719706575818,
"learning_rate": 1.760377910238198e-07,
"loss": 0.2862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2817671597003937,
"step": 4250,
"valid_targets_mean": 3822.6,
"valid_targets_min": 917
},
{
"epoch": 6.743264659270999,
"grad_norm": 0.7810619939316714,
"learning_rate": 1.6572956087876014e-07,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29501527547836304,
"step": 4255,
"valid_targets_mean": 3182.8,
"valid_targets_min": 1080
},
{
"epoch": 6.751188589540412,
"grad_norm": 0.9970801859894827,
"learning_rate": 1.5573105922241037e-07,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3328208327293396,
"step": 4260,
"valid_targets_mean": 2217.5,
"valid_targets_min": 1062
},
{
"epoch": 6.759112519809825,
"grad_norm": 0.7526770442896775,
"learning_rate": 1.4604244218962005e-07,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2694515585899353,
"step": 4265,
"valid_targets_mean": 3435.8,
"valid_targets_min": 1346
},
{
"epoch": 6.767036450079239,
"grad_norm": 0.8154643867852098,
"learning_rate": 1.3666386107613173e-07,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26164501905441284,
"step": 4270,
"valid_targets_mean": 2867.2,
"valid_targets_min": 955
},
{
"epoch": 6.774960380348653,
"grad_norm": 0.9005705221401481,
"learning_rate": 1.2759546233622299e-07,
"loss": 0.3002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.304414302110672,
"step": 4275,
"valid_targets_mean": 2569.8,
"valid_targets_min": 906
},
{
"epoch": 6.7828843106180665,
"grad_norm": 0.9123716561532796,
"learning_rate": 1.1883738758041941e-07,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.289928138256073,
"step": 4280,
"valid_targets_mean": 2864.4,
"valid_targets_min": 683
},
{
"epoch": 6.79080824088748,
"grad_norm": 0.735049289630845,
"learning_rate": 1.1038977357328063e-07,
"loss": 0.2871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2669024169445038,
"step": 4285,
"valid_targets_mean": 3456.4,
"valid_targets_min": 913
},
{
"epoch": 6.798732171156894,
"grad_norm": 0.7856993252453753,
"learning_rate": 1.0225275223126219e-07,
"loss": 0.2731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2780317962169647,
"step": 4290,
"valid_targets_mean": 3268.8,
"valid_targets_min": 1330
},
{
"epoch": 6.806656101426308,
"grad_norm": 0.800287247624352,
"learning_rate": 9.442645062066602e-08,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28255707025527954,
"step": 4295,
"valid_targets_mean": 3144.7,
"valid_targets_min": 1186
},
{
"epoch": 6.814580031695721,
"grad_norm": 0.7997304917655168,
"learning_rate": 8.691099095564426e-08,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2793860137462616,
"step": 4300,
"valid_targets_mean": 3157.3,
"valid_targets_min": 1311
},
{
"epoch": 6.822503961965134,
"grad_norm": 0.7116056078586471,
"learning_rate": 7.970649059629853e-08,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3179277777671814,
"step": 4305,
"valid_targets_mean": 4103.9,
"valid_targets_min": 1133
},
{
"epoch": 6.830427892234549,
"grad_norm": 0.7338611892910522,
"learning_rate": 7.281306204684147e-08,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25144636631011963,
"step": 4310,
"valid_targets_mean": 3348.8,
"valid_targets_min": 1437
},
{
"epoch": 6.838351822503962,
"grad_norm": 0.7686317688403141,
"learning_rate": 6.623081295384248e-08,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2780628800392151,
"step": 4315,
"valid_targets_mean": 3222.4,
"valid_targets_min": 1381
},
{
"epoch": 6.8462757527733755,
"grad_norm": 0.7718844920164412,
"learning_rate": 5.995984610455141e-08,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2787400484085083,
"step": 4320,
"valid_targets_mean": 3495.1,
"valid_targets_min": 881
},
{
"epoch": 6.854199683042789,
"grad_norm": 1.1648381903860865,
"learning_rate": 5.4000259425286415e-08,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2803596556186676,
"step": 4325,
"valid_targets_mean": 2394.1,
"valid_targets_min": 969
},
{
"epoch": 6.862123613312203,
"grad_norm": 0.7006666990793252,
"learning_rate": 4.835214597990856e-08,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2585388720035553,
"step": 4330,
"valid_targets_mean": 3829.1,
"valid_targets_min": 748
},
{
"epoch": 6.870047543581617,
"grad_norm": 0.9365508753028423,
"learning_rate": 4.301559396836519e-08,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2896960973739624,
"step": 4335,
"valid_targets_mean": 2411.0,
"valid_targets_min": 1057
},
{
"epoch": 6.87797147385103,
"grad_norm": 0.7887978749058427,
"learning_rate": 3.799068672531769e-08,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2780733108520508,
"step": 4340,
"valid_targets_mean": 3101.2,
"valid_targets_min": 1149
},
{
"epoch": 6.885895404120443,
"grad_norm": 0.8049956083558146,
"learning_rate": 3.3277502718835896e-08,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3052785396575928,
"step": 4345,
"valid_targets_mean": 3174.3,
"valid_targets_min": 1707
},
{
"epoch": 6.893819334389858,
"grad_norm": 0.8368946913702296,
"learning_rate": 2.8876115549176796e-08,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26890894770622253,
"step": 4350,
"valid_targets_mean": 2879.1,
"valid_targets_min": 1387
},
{
"epoch": 6.901743264659271,
"grad_norm": 0.8341731874690929,
"learning_rate": 2.4786593947625503e-08,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2666037082672119,
"step": 4355,
"valid_targets_mean": 2962.6,
"valid_targets_min": 1371
},
{
"epoch": 6.9096671949286845,
"grad_norm": 0.8535984792313458,
"learning_rate": 2.1009001775440518e-08,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3076822757720947,
"step": 4360,
"valid_targets_mean": 2713.1,
"valid_targets_min": 984
},
{
"epoch": 6.917591125198098,
"grad_norm": 0.7324014319593888,
"learning_rate": 1.7543398022832337e-08,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23690354824066162,
"step": 4365,
"valid_targets_mean": 3588.8,
"valid_targets_min": 885
},
{
"epoch": 6.925515055467512,
"grad_norm": 0.7088032524121062,
"learning_rate": 1.4389836808066382e-08,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2727454900741577,
"step": 4370,
"valid_targets_mean": 4242.9,
"valid_targets_min": 1335
},
{
"epoch": 6.933438985736926,
"grad_norm": 0.8198153597362804,
"learning_rate": 1.1548367376599257e-08,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2867714762687683,
"step": 4375,
"valid_targets_mean": 3238.0,
"valid_targets_min": 1153
},
{
"epoch": 6.941362916006339,
"grad_norm": 0.6663493051614263,
"learning_rate": 9.019034100319347e-09,
"loss": 0.2756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25853022933006287,
"step": 4380,
"valid_targets_mean": 3799.1,
"valid_targets_min": 823
},
{
"epoch": 6.949286846275752,
"grad_norm": 0.8065724319838463,
"learning_rate": 6.801876476854041e-09,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2830263078212738,
"step": 4385,
"valid_targets_mean": 3164.6,
"valid_targets_min": 1264
},
{
"epoch": 6.957210776545167,
"grad_norm": 0.9171202573479613,
"learning_rate": 4.896929128943573e-09,
"loss": 0.2924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27494555711746216,
"step": 4390,
"valid_targets_mean": 2160.8,
"valid_targets_min": 1141
},
{
"epoch": 6.96513470681458,
"grad_norm": 0.719951132738071,
"learning_rate": 3.3042218039147643e-09,
"loss": 0.284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2768862843513489,
"step": 4395,
"valid_targets_mean": 3622.3,
"valid_targets_min": 933
},
{
"epoch": 6.9730586370839935,
"grad_norm": 0.9290612308151752,
"learning_rate": 2.0237793732036384e-09,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2643606960773468,
"step": 4400,
"valid_targets_mean": 2387.6,
"valid_targets_min": 751
},
{
"epoch": 6.980982567353407,
"grad_norm": 0.9045790350311159,
"learning_rate": 1.0556218319757172e-09,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2653629779815674,
"step": 4405,
"valid_targets_mean": 2927.2,
"valid_targets_min": 1066
},
{
"epoch": 6.988906497622821,
"grad_norm": 0.8022249964923563,
"learning_rate": 3.997642988107231e-10,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2766302824020386,
"step": 4410,
"valid_targets_mean": 3228.6,
"valid_targets_min": 987
},
{
"epoch": 6.996830427892235,
"grad_norm": 0.8723843600795462,
"learning_rate": 5.62170154649877e-11,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3014870285987854,
"step": 4415,
"valid_targets_mean": 2630.8,
"valid_targets_min": 1016
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24078989028930664,
"step": 4417,
"total_flos": 1125904534470656.0,
"train_loss": 0.35793851753530226,
"train_runtime": 26871.7295,
"train_samples_per_second": 2.627,
"train_steps_per_second": 0.164,
"valid_targets_mean": 2557.6,
"valid_targets_min": 1102
}
],
"logging_steps": 5,
"max_steps": 4417,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1125904534470656.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}