Files
a1-agenttuning_webshop/trainer_state.json
ModelHub XC 31363eafcc 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/a1-agenttuning_webshop
Source: Original Platform
2026-05-13 04:42:35 +08:00

8804 lines
244 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 3983,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008787346221441126,
"grad_norm": 38.6978838722848,
"learning_rate": 4.010025062656642e-07,
"loss": 0.9753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.9984568357467651,
"step": 5,
"valid_targets_mean": 8204.4,
"valid_targets_min": 7101
},
{
"epoch": 0.01757469244288225,
"grad_norm": 36.44900496665165,
"learning_rate": 9.022556390977444e-07,
"loss": 1.0116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.9997004270553589,
"step": 10,
"valid_targets_mean": 7846.7,
"valid_targets_min": 7038
},
{
"epoch": 0.026362038664323375,
"grad_norm": 30.270769651579307,
"learning_rate": 1.4035087719298246e-06,
"loss": 0.9528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8993930816650391,
"step": 15,
"valid_targets_mean": 7765.9,
"valid_targets_min": 7114
},
{
"epoch": 0.0351493848857645,
"grad_norm": 21.151573665966424,
"learning_rate": 1.904761904761905e-06,
"loss": 0.8447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.826770007610321,
"step": 20,
"valid_targets_mean": 7497.1,
"valid_targets_min": 7056
},
{
"epoch": 0.043936731107205626,
"grad_norm": 8.682299524123176,
"learning_rate": 2.406015037593985e-06,
"loss": 0.7579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.740318775177002,
"step": 25,
"valid_targets_mean": 7646.0,
"valid_targets_min": 6783
},
{
"epoch": 0.05272407732864675,
"grad_norm": 3.8730139452847805,
"learning_rate": 2.9072681704260652e-06,
"loss": 0.679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6605329513549805,
"step": 30,
"valid_targets_mean": 7726.4,
"valid_targets_min": 7030
},
{
"epoch": 0.061511423550087874,
"grad_norm": 2.072050986380433,
"learning_rate": 3.4085213032581455e-06,
"loss": 0.6448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6354802250862122,
"step": 35,
"valid_targets_mean": 8878.6,
"valid_targets_min": 6835
},
{
"epoch": 0.070298769771529,
"grad_norm": 1.6266156298187409,
"learning_rate": 3.909774436090225e-06,
"loss": 0.6236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6287806034088135,
"step": 40,
"valid_targets_mean": 8068.2,
"valid_targets_min": 1038
},
{
"epoch": 0.07908611599297012,
"grad_norm": 1.378698835683514,
"learning_rate": 4.411027568922306e-06,
"loss": 0.5979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6028242707252502,
"step": 45,
"valid_targets_mean": 7623.4,
"valid_targets_min": 6618
},
{
"epoch": 0.08787346221441125,
"grad_norm": 1.0411202965264905,
"learning_rate": 4.912280701754386e-06,
"loss": 0.6119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6232005953788757,
"step": 50,
"valid_targets_mean": 7622.8,
"valid_targets_min": 6016
},
{
"epoch": 0.09666080843585237,
"grad_norm": 0.7770352727164161,
"learning_rate": 5.413533834586467e-06,
"loss": 0.5674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5420302152633667,
"step": 55,
"valid_targets_mean": 8124.6,
"valid_targets_min": 976
},
{
"epoch": 0.1054481546572935,
"grad_norm": 0.796039133753143,
"learning_rate": 5.9147869674185465e-06,
"loss": 0.5599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5746988654136658,
"step": 60,
"valid_targets_mean": 7137.2,
"valid_targets_min": 1850
},
{
"epoch": 0.11423550087873462,
"grad_norm": 0.6336106625079481,
"learning_rate": 6.416040100250627e-06,
"loss": 0.5348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5362576246261597,
"step": 65,
"valid_targets_mean": 7793.7,
"valid_targets_min": 6922
},
{
"epoch": 0.12302284710017575,
"grad_norm": 0.5700155831436438,
"learning_rate": 6.917293233082707e-06,
"loss": 0.5188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.50221848487854,
"step": 70,
"valid_targets_mean": 7509.6,
"valid_targets_min": 1027
},
{
"epoch": 0.13181019332161686,
"grad_norm": 0.5355565407471911,
"learning_rate": 7.418546365914787e-06,
"loss": 0.5024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5001769661903381,
"step": 75,
"valid_targets_mean": 7870.4,
"valid_targets_min": 7366
},
{
"epoch": 0.140597539543058,
"grad_norm": 0.49202281440443324,
"learning_rate": 7.919799498746868e-06,
"loss": 0.4863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.466791570186615,
"step": 80,
"valid_targets_mean": 7792.9,
"valid_targets_min": 6296
},
{
"epoch": 0.14938488576449913,
"grad_norm": 0.4667523533023862,
"learning_rate": 8.421052631578948e-06,
"loss": 0.4748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4645511507987976,
"step": 85,
"valid_targets_mean": 7683.8,
"valid_targets_min": 6859
},
{
"epoch": 0.15817223198594024,
"grad_norm": 0.46381986185960605,
"learning_rate": 8.922305764411027e-06,
"loss": 0.4505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44488275051116943,
"step": 90,
"valid_targets_mean": 7648.6,
"valid_targets_min": 6536
},
{
"epoch": 0.16695957820738136,
"grad_norm": 0.49268227301820733,
"learning_rate": 9.423558897243108e-06,
"loss": 0.4527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4484066069126129,
"step": 95,
"valid_targets_mean": 7653.2,
"valid_targets_min": 6951
},
{
"epoch": 0.1757469244288225,
"grad_norm": 0.4684597306217091,
"learning_rate": 9.924812030075189e-06,
"loss": 0.4377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43168944120407104,
"step": 100,
"valid_targets_mean": 7581.9,
"valid_targets_min": 6596
},
{
"epoch": 0.18453427065026362,
"grad_norm": 0.4533014610851105,
"learning_rate": 1.0426065162907268e-05,
"loss": 0.4206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.411173015832901,
"step": 105,
"valid_targets_mean": 7877.8,
"valid_targets_min": 7346
},
{
"epoch": 0.19332161687170474,
"grad_norm": 0.420632290889455,
"learning_rate": 1.0927318295739348e-05,
"loss": 0.4179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40126168727874756,
"step": 110,
"valid_targets_mean": 8554.2,
"valid_targets_min": 7236
},
{
"epoch": 0.20210896309314588,
"grad_norm": 0.4742732806072542,
"learning_rate": 1.1428571428571429e-05,
"loss": 0.4146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4155147075653076,
"step": 115,
"valid_targets_mean": 8634.9,
"valid_targets_min": 1832
},
{
"epoch": 0.210896309314587,
"grad_norm": 0.4594208243066726,
"learning_rate": 1.192982456140351e-05,
"loss": 0.4177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3859213888645172,
"step": 120,
"valid_targets_mean": 7575.8,
"valid_targets_min": 6708
},
{
"epoch": 0.21968365553602812,
"grad_norm": 0.4997540440424557,
"learning_rate": 1.2431077694235589e-05,
"loss": 0.4037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3957754969596863,
"step": 125,
"valid_targets_mean": 7793.8,
"valid_targets_min": 7241
},
{
"epoch": 0.22847100175746923,
"grad_norm": 0.428361000886045,
"learning_rate": 1.293233082706767e-05,
"loss": 0.4002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3891918659210205,
"step": 130,
"valid_targets_mean": 8369.6,
"valid_targets_min": 7025
},
{
"epoch": 0.23725834797891038,
"grad_norm": 0.4743185424801239,
"learning_rate": 1.343358395989975e-05,
"loss": 0.405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3979344964027405,
"step": 135,
"valid_targets_mean": 7767.6,
"valid_targets_min": 6628
},
{
"epoch": 0.2460456942003515,
"grad_norm": 0.4841423226769736,
"learning_rate": 1.3934837092731829e-05,
"loss": 0.4012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3948283791542053,
"step": 140,
"valid_targets_mean": 7875.4,
"valid_targets_min": 7146
},
{
"epoch": 0.2548330404217926,
"grad_norm": 0.588951244848714,
"learning_rate": 1.443609022556391e-05,
"loss": 0.3951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4132270812988281,
"step": 145,
"valid_targets_mean": 8222.6,
"valid_targets_min": 6658
},
{
"epoch": 0.26362038664323373,
"grad_norm": 0.5495889925349385,
"learning_rate": 1.493734335839599e-05,
"loss": 0.3902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38743358850479126,
"step": 150,
"valid_targets_mean": 7656.6,
"valid_targets_min": 6637
},
{
"epoch": 0.27240773286467485,
"grad_norm": 0.5958013982628857,
"learning_rate": 1.543859649122807e-05,
"loss": 0.3796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3920867443084717,
"step": 155,
"valid_targets_mean": 7690.2,
"valid_targets_min": 6713
},
{
"epoch": 0.281195079086116,
"grad_norm": 0.46010368035874943,
"learning_rate": 1.593984962406015e-05,
"loss": 0.3743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36779534816741943,
"step": 160,
"valid_targets_mean": 7557.8,
"valid_targets_min": 1962
},
{
"epoch": 0.28998242530755713,
"grad_norm": 0.5929789279662462,
"learning_rate": 1.6441102756892233e-05,
"loss": 0.3778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3819672167301178,
"step": 165,
"valid_targets_mean": 7351.0,
"valid_targets_min": 4393
},
{
"epoch": 0.29876977152899825,
"grad_norm": 0.5524672538423943,
"learning_rate": 1.694235588972431e-05,
"loss": 0.372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36684030294418335,
"step": 170,
"valid_targets_mean": 7323.3,
"valid_targets_min": 4028
},
{
"epoch": 0.30755711775043937,
"grad_norm": 0.6041910949646787,
"learning_rate": 1.744360902255639e-05,
"loss": 0.378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3752996623516083,
"step": 175,
"valid_targets_mean": 7826.6,
"valid_targets_min": 6948
},
{
"epoch": 0.3163444639718805,
"grad_norm": 0.5273237629264332,
"learning_rate": 1.7944862155388473e-05,
"loss": 0.3734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3750697374343872,
"step": 180,
"valid_targets_mean": 8417.7,
"valid_targets_min": 6580
},
{
"epoch": 0.3251318101933216,
"grad_norm": 0.5634785021242477,
"learning_rate": 1.8446115288220552e-05,
"loss": 0.3701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3679591715335846,
"step": 185,
"valid_targets_mean": 8481.8,
"valid_targets_min": 7148
},
{
"epoch": 0.3339191564147627,
"grad_norm": 0.6490715556412919,
"learning_rate": 1.894736842105263e-05,
"loss": 0.3707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35834622383117676,
"step": 190,
"valid_targets_mean": 7840.2,
"valid_targets_min": 7374
},
{
"epoch": 0.3427065026362039,
"grad_norm": 0.7040665040619704,
"learning_rate": 1.9448621553884713e-05,
"loss": 0.3633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.360437273979187,
"step": 195,
"valid_targets_mean": 7532.4,
"valid_targets_min": 6567
},
{
"epoch": 0.351493848857645,
"grad_norm": 0.6661072177146762,
"learning_rate": 1.9949874686716792e-05,
"loss": 0.3675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3582548499107361,
"step": 200,
"valid_targets_mean": 7941.7,
"valid_targets_min": 4770
},
{
"epoch": 0.3602811950790861,
"grad_norm": 0.6446147681036916,
"learning_rate": 2.045112781954887e-05,
"loss": 0.3674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3482518792152405,
"step": 205,
"valid_targets_mean": 7836.3,
"valid_targets_min": 6808
},
{
"epoch": 0.36906854130052724,
"grad_norm": 0.7425622932228986,
"learning_rate": 2.0952380952380954e-05,
"loss": 0.3641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3838837742805481,
"step": 210,
"valid_targets_mean": 7816.9,
"valid_targets_min": 7214
},
{
"epoch": 0.37785588752196836,
"grad_norm": 0.5581982531493921,
"learning_rate": 2.1453634085213033e-05,
"loss": 0.3575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36858636140823364,
"step": 215,
"valid_targets_mean": 7943.6,
"valid_targets_min": 7011
},
{
"epoch": 0.3866432337434095,
"grad_norm": 0.5795300028635507,
"learning_rate": 2.1954887218045115e-05,
"loss": 0.3665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36795204877853394,
"step": 220,
"valid_targets_mean": 7693.4,
"valid_targets_min": 6714
},
{
"epoch": 0.3954305799648506,
"grad_norm": 0.5961129101229606,
"learning_rate": 2.2456140350877194e-05,
"loss": 0.3612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35297703742980957,
"step": 225,
"valid_targets_mean": 7667.0,
"valid_targets_min": 7113
},
{
"epoch": 0.40421792618629176,
"grad_norm": 0.5346483708070339,
"learning_rate": 2.2957393483709277e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.355159193277359,
"step": 230,
"valid_targets_mean": 7672.8,
"valid_targets_min": 6972
},
{
"epoch": 0.4130052724077329,
"grad_norm": 0.6007854655638409,
"learning_rate": 2.3458646616541356e-05,
"loss": 0.3485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34793052077293396,
"step": 235,
"valid_targets_mean": 7685.1,
"valid_targets_min": 6490
},
{
"epoch": 0.421792618629174,
"grad_norm": 0.6225739772119563,
"learning_rate": 2.3959899749373438e-05,
"loss": 0.3538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3514181971549988,
"step": 240,
"valid_targets_mean": 7597.9,
"valid_targets_min": 6470
},
{
"epoch": 0.4305799648506151,
"grad_norm": 0.5289284486385892,
"learning_rate": 2.4461152882205514e-05,
"loss": 0.3536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3455802798271179,
"step": 245,
"valid_targets_mean": 7803.9,
"valid_targets_min": 7042
},
{
"epoch": 0.43936731107205623,
"grad_norm": 0.6527177005189011,
"learning_rate": 2.4962406015037596e-05,
"loss": 0.3401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3467724323272705,
"step": 250,
"valid_targets_mean": 7513.4,
"valid_targets_min": 6591
},
{
"epoch": 0.44815465729349735,
"grad_norm": 0.592816842394283,
"learning_rate": 2.5463659147869675e-05,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3463764190673828,
"step": 255,
"valid_targets_mean": 7793.3,
"valid_targets_min": 6874
},
{
"epoch": 0.45694200351493847,
"grad_norm": 0.5890938532081315,
"learning_rate": 2.5964912280701757e-05,
"loss": 0.3586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36159226298332214,
"step": 260,
"valid_targets_mean": 7705.4,
"valid_targets_min": 6749
},
{
"epoch": 0.46572934973637964,
"grad_norm": 0.5980314248262064,
"learning_rate": 2.6466165413533836e-05,
"loss": 0.3551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35110318660736084,
"step": 265,
"valid_targets_mean": 8175.6,
"valid_targets_min": 7201
},
{
"epoch": 0.47451669595782076,
"grad_norm": 0.49692421838506523,
"learning_rate": 2.696741854636592e-05,
"loss": 0.3583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3421872854232788,
"step": 270,
"valid_targets_mean": 8735.7,
"valid_targets_min": 7134
},
{
"epoch": 0.4833040421792619,
"grad_norm": 0.7089117092095248,
"learning_rate": 2.7468671679197994e-05,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3664856553077698,
"step": 275,
"valid_targets_mean": 7563.2,
"valid_targets_min": 6711
},
{
"epoch": 0.492091388400703,
"grad_norm": 0.6619046729096473,
"learning_rate": 2.7969924812030077e-05,
"loss": 0.3564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38198232650756836,
"step": 280,
"valid_targets_mean": 8438.1,
"valid_targets_min": 6326
},
{
"epoch": 0.5008787346221442,
"grad_norm": 0.8062671883298813,
"learning_rate": 2.8471177944862156e-05,
"loss": 0.3461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3398236632347107,
"step": 285,
"valid_targets_mean": 7585.6,
"valid_targets_min": 6803
},
{
"epoch": 0.5096660808435852,
"grad_norm": 0.5995976148755775,
"learning_rate": 2.8972431077694238e-05,
"loss": 0.3583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35415637493133545,
"step": 290,
"valid_targets_mean": 9409.5,
"valid_targets_min": 7583
},
{
"epoch": 0.5184534270650264,
"grad_norm": 0.49270556955808065,
"learning_rate": 2.9473684210526317e-05,
"loss": 0.3473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.332955002784729,
"step": 295,
"valid_targets_mean": 8608.6,
"valid_targets_min": 6638
},
{
"epoch": 0.5272407732864675,
"grad_norm": 0.6063298210454802,
"learning_rate": 2.99749373433584e-05,
"loss": 0.3463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35231274366378784,
"step": 300,
"valid_targets_mean": 7578.2,
"valid_targets_min": 6504
},
{
"epoch": 0.5360281195079086,
"grad_norm": 0.6270112520829497,
"learning_rate": 3.047619047619048e-05,
"loss": 0.3486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3481753170490265,
"step": 305,
"valid_targets_mean": 7567.4,
"valid_targets_min": 6744
},
{
"epoch": 0.5448154657293497,
"grad_norm": 0.5807218083467116,
"learning_rate": 3.097744360902256e-05,
"loss": 0.35,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3547857403755188,
"step": 310,
"valid_targets_mean": 7679.1,
"valid_targets_min": 6530
},
{
"epoch": 0.5536028119507909,
"grad_norm": 0.5797707420078969,
"learning_rate": 3.147869674185464e-05,
"loss": 0.3523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3483213782310486,
"step": 315,
"valid_targets_mean": 7858.9,
"valid_targets_min": 7052
},
{
"epoch": 0.562390158172232,
"grad_norm": 0.5659965873691432,
"learning_rate": 3.197994987468672e-05,
"loss": 0.3397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32356488704681396,
"step": 320,
"valid_targets_mean": 8695.8,
"valid_targets_min": 7163
},
{
"epoch": 0.5711775043936731,
"grad_norm": 0.549458311776311,
"learning_rate": 3.24812030075188e-05,
"loss": 0.3484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3535029888153076,
"step": 325,
"valid_targets_mean": 7525.9,
"valid_targets_min": 6717
},
{
"epoch": 0.5799648506151143,
"grad_norm": 0.6488259689086234,
"learning_rate": 3.298245614035088e-05,
"loss": 0.3426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33021873235702515,
"step": 330,
"valid_targets_mean": 8136.8,
"valid_targets_min": 7100
},
{
"epoch": 0.5887521968365553,
"grad_norm": 0.6190982787223087,
"learning_rate": 3.3483709273182956e-05,
"loss": 0.3433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3612127900123596,
"step": 335,
"valid_targets_mean": 7711.2,
"valid_targets_min": 6996
},
{
"epoch": 0.5975395430579965,
"grad_norm": 0.7134611976932143,
"learning_rate": 3.398496240601504e-05,
"loss": 0.3333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32457542419433594,
"step": 340,
"valid_targets_mean": 7711.4,
"valid_targets_min": 6467
},
{
"epoch": 0.6063268892794376,
"grad_norm": 0.4825474653552003,
"learning_rate": 3.448621553884712e-05,
"loss": 0.3413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33146989345550537,
"step": 345,
"valid_targets_mean": 8664.6,
"valid_targets_min": 6905
},
{
"epoch": 0.6151142355008787,
"grad_norm": 0.6066546859254534,
"learning_rate": 3.49874686716792e-05,
"loss": 0.336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3363463878631592,
"step": 350,
"valid_targets_mean": 7706.2,
"valid_targets_min": 6749
},
{
"epoch": 0.6239015817223199,
"grad_norm": 0.5358291220456245,
"learning_rate": 3.548872180451128e-05,
"loss": 0.3438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35363635420799255,
"step": 355,
"valid_targets_mean": 8824.1,
"valid_targets_min": 6443
},
{
"epoch": 0.632688927943761,
"grad_norm": 0.5400754436186094,
"learning_rate": 3.5989974937343364e-05,
"loss": 0.3357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33272236585617065,
"step": 360,
"valid_targets_mean": 7586.1,
"valid_targets_min": 6781
},
{
"epoch": 0.6414762741652021,
"grad_norm": 0.5505762025043917,
"learning_rate": 3.649122807017544e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.337479829788208,
"step": 365,
"valid_targets_mean": 7690.2,
"valid_targets_min": 7086
},
{
"epoch": 0.6502636203866432,
"grad_norm": 0.5973982759050109,
"learning_rate": 3.699248120300752e-05,
"loss": 0.3412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35638201236724854,
"step": 370,
"valid_targets_mean": 7434.1,
"valid_targets_min": 6424
},
{
"epoch": 0.6590509666080844,
"grad_norm": 0.5693931599659594,
"learning_rate": 3.74937343358396e-05,
"loss": 0.3424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.338626891374588,
"step": 375,
"valid_targets_mean": 7283.1,
"valid_targets_min": 3803
},
{
"epoch": 0.6678383128295254,
"grad_norm": 0.5971595429698976,
"learning_rate": 3.799498746867168e-05,
"loss": 0.3445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3575047552585602,
"step": 380,
"valid_targets_mean": 7449.1,
"valid_targets_min": 6542
},
{
"epoch": 0.6766256590509666,
"grad_norm": 0.5578406633304958,
"learning_rate": 3.849624060150376e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32988211512565613,
"step": 385,
"valid_targets_mean": 7770.6,
"valid_targets_min": 6719
},
{
"epoch": 0.6854130052724078,
"grad_norm": 0.5668191415205301,
"learning_rate": 3.8997493734335845e-05,
"loss": 0.3394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3269059956073761,
"step": 390,
"valid_targets_mean": 7783.9,
"valid_targets_min": 6911
},
{
"epoch": 0.6942003514938488,
"grad_norm": 0.5498326107964799,
"learning_rate": 3.949874686716792e-05,
"loss": 0.3354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32613101601600647,
"step": 395,
"valid_targets_mean": 7709.3,
"valid_targets_min": 6875
},
{
"epoch": 0.70298769771529,
"grad_norm": 0.5545998996247578,
"learning_rate": 4e-05,
"loss": 0.3373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.335163950920105,
"step": 400,
"valid_targets_mean": 7833.9,
"valid_targets_min": 7032
},
{
"epoch": 0.7117750439367311,
"grad_norm": 0.5467208617580587,
"learning_rate": 3.999980791075177e-05,
"loss": 0.3326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3213801980018616,
"step": 405,
"valid_targets_mean": 7722.5,
"valid_targets_min": 7033
},
{
"epoch": 0.7205623901581723,
"grad_norm": 0.5385613574993566,
"learning_rate": 3.999923164669689e-05,
"loss": 0.3355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3487439751625061,
"step": 410,
"valid_targets_mean": 7201.6,
"valid_targets_min": 735
},
{
"epoch": 0.7293497363796133,
"grad_norm": 0.5542392343867473,
"learning_rate": 3.9998271218904776e-05,
"loss": 0.3342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3364104628562927,
"step": 415,
"valid_targets_mean": 7159.6,
"valid_targets_min": 791
},
{
"epoch": 0.7381370826010545,
"grad_norm": 0.5169891050813411,
"learning_rate": 3.999692664582422e-05,
"loss": 0.3268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32832974195480347,
"step": 420,
"valid_targets_mean": 7732.6,
"valid_targets_min": 7105
},
{
"epoch": 0.7469244288224957,
"grad_norm": 0.5031414610488824,
"learning_rate": 3.999519795328302e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33884960412979126,
"step": 425,
"valid_targets_mean": 9959.8,
"valid_targets_min": 7246
},
{
"epoch": 0.7557117750439367,
"grad_norm": 0.5026124113090491,
"learning_rate": 3.9993085174487494e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32484903931617737,
"step": 430,
"valid_targets_mean": 8865.3,
"valid_targets_min": 6744
},
{
"epoch": 0.7644991212653779,
"grad_norm": 0.4817890109970856,
"learning_rate": 3.999058835002187e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3292863368988037,
"step": 435,
"valid_targets_mean": 7735.2,
"valid_targets_min": 7043
},
{
"epoch": 0.773286467486819,
"grad_norm": 0.4936188500345479,
"learning_rate": 3.998770752784745e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3398468494415283,
"step": 440,
"valid_targets_mean": 8204.1,
"valid_targets_min": 5811
},
{
"epoch": 0.7820738137082601,
"grad_norm": 0.6464708805528303,
"learning_rate": 3.998444276330172e-05,
"loss": 0.3303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.325589656829834,
"step": 445,
"valid_targets_mean": 7733.5,
"valid_targets_min": 6404
},
{
"epoch": 0.7908611599297012,
"grad_norm": 0.5662160775112339,
"learning_rate": 3.998079411909731e-05,
"loss": 0.3309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3355258107185364,
"step": 450,
"valid_targets_mean": 7588.7,
"valid_targets_min": 6381
},
{
"epoch": 0.7996485061511424,
"grad_norm": 0.5147294588993504,
"learning_rate": 3.997676166532076e-05,
"loss": 0.3246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.331130713224411,
"step": 455,
"valid_targets_mean": 7780.9,
"valid_targets_min": 6994
},
{
"epoch": 0.8084358523725835,
"grad_norm": 0.48151422115917686,
"learning_rate": 3.997234547943116e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3537714183330536,
"step": 460,
"valid_targets_mean": 7668.2,
"valid_targets_min": 6956
},
{
"epoch": 0.8172231985940246,
"grad_norm": 0.5152148119091646,
"learning_rate": 3.9967545646258684e-05,
"loss": 0.3301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34110844135284424,
"step": 465,
"valid_targets_mean": 7722.5,
"valid_targets_min": 7138
},
{
"epoch": 0.8260105448154658,
"grad_norm": 0.5327181478773625,
"learning_rate": 3.996236225800298e-05,
"loss": 0.3299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3305248022079468,
"step": 470,
"valid_targets_mean": 7872.7,
"valid_targets_min": 7232
},
{
"epoch": 0.8347978910369068,
"grad_norm": 0.4832077772333212,
"learning_rate": 3.995679541423137e-05,
"loss": 0.332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3223893642425537,
"step": 475,
"valid_targets_mean": 8212.9,
"valid_targets_min": 1033
},
{
"epoch": 0.843585237258348,
"grad_norm": 0.5352684147985118,
"learning_rate": 3.9950845221876926e-05,
"loss": 0.3348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3198257386684418,
"step": 480,
"valid_targets_mean": 7823.2,
"valid_targets_min": 6958
},
{
"epoch": 0.8523725834797891,
"grad_norm": 0.5561370729488068,
"learning_rate": 3.994451179523644e-05,
"loss": 0.336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3468901515007019,
"step": 485,
"valid_targets_mean": 7766.8,
"valid_targets_min": 7054
},
{
"epoch": 0.8611599297012302,
"grad_norm": 0.49490216854159513,
"learning_rate": 3.993779525596824e-05,
"loss": 0.3341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.325663298368454,
"step": 490,
"valid_targets_mean": 7161.1,
"valid_targets_min": 889
},
{
"epoch": 0.8699472759226714,
"grad_norm": 0.5556201651984429,
"learning_rate": 3.993069573308982e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3325248956680298,
"step": 495,
"valid_targets_mean": 7954.0,
"valid_targets_min": 6859
},
{
"epoch": 0.8787346221441125,
"grad_norm": 0.5767089291539206,
"learning_rate": 3.992321336297537e-05,
"loss": 0.3349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32498735189437866,
"step": 500,
"valid_targets_mean": 7508.8,
"valid_targets_min": 6708
},
{
"epoch": 0.8875219683655536,
"grad_norm": 0.592345847494032,
"learning_rate": 3.99153482893532e-05,
"loss": 0.3257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3253369629383087,
"step": 505,
"valid_targets_mean": 7774.0,
"valid_targets_min": 6744
},
{
"epoch": 0.8963093145869947,
"grad_norm": 0.5437305711608164,
"learning_rate": 3.99071006633029e-05,
"loss": 0.3348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3150107264518738,
"step": 510,
"valid_targets_mean": 7838.1,
"valid_targets_min": 7349
},
{
"epoch": 0.9050966608084359,
"grad_norm": 0.6455180582172454,
"learning_rate": 3.9898470643252496e-05,
"loss": 0.3182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31834477186203003,
"step": 515,
"valid_targets_mean": 7792.3,
"valid_targets_min": 7277
},
{
"epoch": 0.9138840070298769,
"grad_norm": 0.5860488049976041,
"learning_rate": 3.9889458394975404e-05,
"loss": 0.3369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3431106209754944,
"step": 520,
"valid_targets_mean": 7672.0,
"valid_targets_min": 6788
},
{
"epoch": 0.9226713532513181,
"grad_norm": 0.49869424349859637,
"learning_rate": 3.9880064091587226e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3385096788406372,
"step": 525,
"valid_targets_mean": 8874.5,
"valid_targets_min": 7049
},
{
"epoch": 0.9314586994727593,
"grad_norm": 0.4791798901114336,
"learning_rate": 3.9870287913542416e-05,
"loss": 0.3275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3190639317035675,
"step": 530,
"valid_targets_mean": 7695.1,
"valid_targets_min": 7294
},
{
"epoch": 0.9402460456942003,
"grad_norm": 0.5268875896832551,
"learning_rate": 3.9860130048630855e-05,
"loss": 0.3299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3270207345485687,
"step": 535,
"valid_targets_mean": 8432.9,
"valid_targets_min": 6766
},
{
"epoch": 0.9490333919156415,
"grad_norm": 0.5109366805942274,
"learning_rate": 3.9849590691974206e-05,
"loss": 0.3251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33174222707748413,
"step": 540,
"valid_targets_mean": 7830.2,
"valid_targets_min": 7068
},
{
"epoch": 0.9578207381370826,
"grad_norm": 0.5965366370776712,
"learning_rate": 3.9838670046022166e-05,
"loss": 0.3245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3299826979637146,
"step": 545,
"valid_targets_mean": 7773.7,
"valid_targets_min": 7215
},
{
"epoch": 0.9666080843585237,
"grad_norm": 0.4847692573044287,
"learning_rate": 3.982736832054862e-05,
"loss": 0.3263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3373975157737732,
"step": 550,
"valid_targets_mean": 7721.5,
"valid_targets_min": 6768
},
{
"epoch": 0.9753954305799648,
"grad_norm": 0.5236300498438478,
"learning_rate": 3.9815685732647556e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31755590438842773,
"step": 555,
"valid_targets_mean": 7896.3,
"valid_targets_min": 7133
},
{
"epoch": 0.984182776801406,
"grad_norm": 0.5487102288494853,
"learning_rate": 3.9803622506728916e-05,
"loss": 0.3258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31796884536743164,
"step": 560,
"valid_targets_mean": 8345.5,
"valid_targets_min": 6772
},
{
"epoch": 0.9929701230228472,
"grad_norm": 0.48622322101501725,
"learning_rate": 3.9791178874514314e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3005170524120331,
"step": 565,
"valid_targets_mean": 7888.6,
"valid_targets_min": 7338
},
{
"epoch": 1.0017574692442883,
"grad_norm": 0.5209897970025318,
"learning_rate": 3.977835507503254e-05,
"loss": 0.3191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32238900661468506,
"step": 570,
"valid_targets_mean": 9126.5,
"valid_targets_min": 7123
},
{
"epoch": 1.0105448154657293,
"grad_norm": 0.5277875114886403,
"learning_rate": 3.9765151354614995e-05,
"loss": 0.3235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3237850069999695,
"step": 575,
"valid_targets_mean": 7542.9,
"valid_targets_min": 6828
},
{
"epoch": 1.0193321616871704,
"grad_norm": 0.5597616301590367,
"learning_rate": 3.9751567966890946e-05,
"loss": 0.3254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32237479090690613,
"step": 580,
"valid_targets_mean": 7596.3,
"valid_targets_min": 6688
},
{
"epoch": 1.0281195079086116,
"grad_norm": 0.5285554956078993,
"learning_rate": 3.973760517278268e-05,
"loss": 0.325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3246050775051117,
"step": 585,
"valid_targets_mean": 7218.9,
"valid_targets_min": 967
},
{
"epoch": 1.0369068541300528,
"grad_norm": 0.5016573118247876,
"learning_rate": 3.972326324050045e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3259458541870117,
"step": 590,
"valid_targets_mean": 7718.3,
"valid_targets_min": 6451
},
{
"epoch": 1.0456942003514937,
"grad_norm": 0.47518350285088584,
"learning_rate": 3.970854244553736e-05,
"loss": 0.3278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33282628655433655,
"step": 595,
"valid_targets_mean": 7674.4,
"valid_targets_min": 7189
},
{
"epoch": 1.054481546572935,
"grad_norm": 0.5009335948586953,
"learning_rate": 3.969344307066404e-05,
"loss": 0.3278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3331737816333771,
"step": 600,
"valid_targets_mean": 7871.4,
"valid_targets_min": 7054
},
{
"epoch": 1.063268892794376,
"grad_norm": 0.5651686519634432,
"learning_rate": 3.967796540592327e-05,
"loss": 0.3183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3132637143135071,
"step": 605,
"valid_targets_mean": 7547.6,
"valid_targets_min": 6890
},
{
"epoch": 1.0720562390158173,
"grad_norm": 0.42436518651387334,
"learning_rate": 3.966210974862433e-05,
"loss": 0.3209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30082017183303833,
"step": 610,
"valid_targets_mean": 7801.0,
"valid_targets_min": 6996
},
{
"epoch": 1.0808435852372584,
"grad_norm": 0.543738759441098,
"learning_rate": 3.964587640333736e-05,
"loss": 0.3164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31432604789733887,
"step": 615,
"valid_targets_mean": 7765.2,
"valid_targets_min": 6892
},
{
"epoch": 1.0896309314586994,
"grad_norm": 0.5181416198044555,
"learning_rate": 3.9629265681887456e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32652005553245544,
"step": 620,
"valid_targets_mean": 7536.4,
"valid_targets_min": 5784
},
{
"epoch": 1.0984182776801406,
"grad_norm": 0.5140276582122142,
"learning_rate": 3.961227790334872e-05,
"loss": 0.3222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31211698055267334,
"step": 625,
"valid_targets_mean": 7735.3,
"valid_targets_min": 7001
},
{
"epoch": 1.1072056239015817,
"grad_norm": 0.5282119837909162,
"learning_rate": 3.959491339403814e-05,
"loss": 0.3277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33794674277305603,
"step": 630,
"valid_targets_mean": 7889.0,
"valid_targets_min": 6956
},
{
"epoch": 1.115992970123023,
"grad_norm": 0.47248502297977735,
"learning_rate": 3.957717248750923e-05,
"loss": 0.3193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3132312595844269,
"step": 635,
"valid_targets_mean": 9497.9,
"valid_targets_min": 7402
},
{
"epoch": 1.124780316344464,
"grad_norm": 0.6004536131705314,
"learning_rate": 3.9559055524545755e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32647284865379333,
"step": 640,
"valid_targets_mean": 7229.4,
"valid_targets_min": 1051
},
{
"epoch": 1.133567662565905,
"grad_norm": 0.6010689936463117,
"learning_rate": 3.9540562853155086e-05,
"loss": 0.3254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3334662914276123,
"step": 645,
"valid_targets_mean": 7780.3,
"valid_targets_min": 6782
},
{
"epoch": 1.1423550087873462,
"grad_norm": 0.4885332419281782,
"learning_rate": 3.9521694828561566e-05,
"loss": 0.3214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3191852867603302,
"step": 650,
"valid_targets_mean": 7669.9,
"valid_targets_min": 7189
},
{
"epoch": 1.1511423550087874,
"grad_norm": 0.5719088465025136,
"learning_rate": 3.950245181319965e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3156038522720337,
"step": 655,
"valid_targets_mean": 7323.6,
"valid_targets_min": 4561
},
{
"epoch": 1.1599297012302285,
"grad_norm": 0.48450178709647856,
"learning_rate": 3.948283417670698e-05,
"loss": 0.3228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31226205825805664,
"step": 660,
"valid_targets_mean": 7599.6,
"valid_targets_min": 6959
},
{
"epoch": 1.1687170474516697,
"grad_norm": 0.5336121025006089,
"learning_rate": 3.9462842295917254e-05,
"loss": 0.326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.320054292678833,
"step": 665,
"valid_targets_mean": 7689.0,
"valid_targets_min": 6442
},
{
"epoch": 1.1775043936731107,
"grad_norm": 0.5168172619234773,
"learning_rate": 3.944247655485302e-05,
"loss": 0.3147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3125112056732178,
"step": 670,
"valid_targets_mean": 7615.4,
"valid_targets_min": 7042
},
{
"epoch": 1.1862917398945518,
"grad_norm": 0.5306935722278405,
"learning_rate": 3.942173734471825e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3204430341720581,
"step": 675,
"valid_targets_mean": 7598.4,
"valid_targets_min": 6504
},
{
"epoch": 1.195079086115993,
"grad_norm": 0.49391490325677384,
"learning_rate": 3.940062506389089e-05,
"loss": 0.3173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32571330666542053,
"step": 680,
"valid_targets_mean": 7688.0,
"valid_targets_min": 6977
},
{
"epoch": 1.2038664323374342,
"grad_norm": 0.4931314528962855,
"learning_rate": 3.937914011791513e-05,
"loss": 0.3338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33908209204673767,
"step": 685,
"valid_targets_mean": 8584.7,
"valid_targets_min": 7423
},
{
"epoch": 1.2126537785588751,
"grad_norm": 0.48655008582263876,
"learning_rate": 3.9357282919493717e-05,
"loss": 0.3139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32384777069091797,
"step": 690,
"valid_targets_mean": 7632.4,
"valid_targets_min": 5869
},
{
"epoch": 1.2214411247803163,
"grad_norm": 0.500738194693758,
"learning_rate": 3.93350538884799e-05,
"loss": 0.3219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33496755361557007,
"step": 695,
"valid_targets_mean": 7711.9,
"valid_targets_min": 6950
},
{
"epoch": 1.2302284710017575,
"grad_norm": 0.5352717845302437,
"learning_rate": 3.931245345186949e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30350565910339355,
"step": 700,
"valid_targets_mean": 8455.4,
"valid_targets_min": 6773
},
{
"epoch": 1.2390158172231986,
"grad_norm": 0.4775215505295606,
"learning_rate": 3.928948204379256e-05,
"loss": 0.3206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3287331461906433,
"step": 705,
"valid_targets_mean": 7821.4,
"valid_targets_min": 7257
},
{
"epoch": 1.2478031634446398,
"grad_norm": 0.4829129399145732,
"learning_rate": 3.926614010550516e-05,
"loss": 0.3177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3171924352645874,
"step": 710,
"valid_targets_mean": 7675.7,
"valid_targets_min": 6679
},
{
"epoch": 1.2565905096660808,
"grad_norm": 0.4483991183139604,
"learning_rate": 3.924242808538083e-05,
"loss": 0.3159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31392353773117065,
"step": 715,
"valid_targets_mean": 7726.5,
"valid_targets_min": 6153
},
{
"epoch": 1.265377855887522,
"grad_norm": 0.5014168550769796,
"learning_rate": 3.9218346438901996e-05,
"loss": 0.3154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.317163348197937,
"step": 720,
"valid_targets_mean": 7591.8,
"valid_targets_min": 6396
},
{
"epoch": 1.2741652021089631,
"grad_norm": 0.5122275835888518,
"learning_rate": 3.9193895628651174e-05,
"loss": 0.3209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3096388876438141,
"step": 725,
"valid_targets_mean": 7610.3,
"valid_targets_min": 6982
},
{
"epoch": 1.2829525483304043,
"grad_norm": 0.48739308701526257,
"learning_rate": 3.916907612430215e-05,
"loss": 0.3184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3071346879005432,
"step": 730,
"valid_targets_mean": 8241.4,
"valid_targets_min": 7084
},
{
"epoch": 1.2917398945518452,
"grad_norm": 0.5284650604703849,
"learning_rate": 3.914388840261092e-05,
"loss": 0.323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3126200735569,
"step": 735,
"valid_targets_mean": 7693.7,
"valid_targets_min": 6791
},
{
"epoch": 1.3005272407732864,
"grad_norm": 0.4857415987362,
"learning_rate": 3.911833294740653e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.328471302986145,
"step": 740,
"valid_targets_mean": 7574.6,
"valid_targets_min": 5191
},
{
"epoch": 1.3093145869947276,
"grad_norm": 0.41085987983419675,
"learning_rate": 3.9092410249581794e-05,
"loss": 0.3117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30733928084373474,
"step": 745,
"valid_targets_mean": 7675.6,
"valid_targets_min": 6926
},
{
"epoch": 1.3181019332161688,
"grad_norm": 0.45850657958304913,
"learning_rate": 3.9066120807083875e-05,
"loss": 0.3197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3096606433391571,
"step": 750,
"valid_targets_mean": 7721.5,
"valid_targets_min": 7048
},
{
"epoch": 1.32688927943761,
"grad_norm": 0.5218607509428387,
"learning_rate": 3.90394651249047e-05,
"loss": 0.3099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3240182399749756,
"step": 755,
"valid_targets_mean": 7440.1,
"valid_targets_min": 6248
},
{
"epoch": 1.335676625659051,
"grad_norm": 0.5226476860028977,
"learning_rate": 3.901244371507126e-05,
"loss": 0.3151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3309449553489685,
"step": 760,
"valid_targets_mean": 7491.1,
"valid_targets_min": 6608
},
{
"epoch": 1.344463971880492,
"grad_norm": 0.48601085019051943,
"learning_rate": 3.898505709663578e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3042697310447693,
"step": 765,
"valid_targets_mean": 7941.6,
"valid_targets_min": 598
},
{
"epoch": 1.3532513181019332,
"grad_norm": 0.5192638452483873,
"learning_rate": 3.895730579566576e-05,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.335843950510025,
"step": 770,
"valid_targets_mean": 8004.8,
"valid_targets_min": 792
},
{
"epoch": 1.3620386643233744,
"grad_norm": 0.49021475730604136,
"learning_rate": 3.892919034523385e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31338605284690857,
"step": 775,
"valid_targets_mean": 7635.1,
"valid_targets_min": 3605
},
{
"epoch": 1.3708260105448153,
"grad_norm": 0.4732842882172017,
"learning_rate": 3.8900711285407625e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34282398223876953,
"step": 780,
"valid_targets_mean": 7690.4,
"valid_targets_min": 6795
},
{
"epoch": 1.3796133567662565,
"grad_norm": 0.43326778052686593,
"learning_rate": 3.887186916323921e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3298339247703552,
"step": 785,
"valid_targets_mean": 9189.6,
"valid_targets_min": 7063
},
{
"epoch": 1.3884007029876977,
"grad_norm": 0.4569354721607761,
"learning_rate": 3.884266453275476e-05,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31393471360206604,
"step": 790,
"valid_targets_mean": 7767.4,
"valid_targets_min": 6796
},
{
"epoch": 1.3971880492091389,
"grad_norm": 0.41395577038033143,
"learning_rate": 3.8813097954943814e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2988349199295044,
"step": 795,
"valid_targets_mean": 7797.6,
"valid_targets_min": 6788
},
{
"epoch": 1.40597539543058,
"grad_norm": 0.44276378335869104,
"learning_rate": 3.878316999774856e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3206707239151001,
"step": 800,
"valid_targets_mean": 8609.4,
"valid_targets_min": 6835
},
{
"epoch": 1.4147627416520212,
"grad_norm": 0.4785714205137601,
"learning_rate": 3.8752881236052864e-05,
"loss": 0.3179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3262031674385071,
"step": 805,
"valid_targets_mean": 7643.6,
"valid_targets_min": 7144
},
{
"epoch": 1.4235500878734622,
"grad_norm": 0.4654192860411442,
"learning_rate": 3.872223225167129e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31912875175476074,
"step": 810,
"valid_targets_mean": 8542.4,
"valid_targets_min": 6823
},
{
"epoch": 1.4323374340949033,
"grad_norm": 0.4566427062230126,
"learning_rate": 3.8691223633337854e-05,
"loss": 0.3116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31717827916145325,
"step": 815,
"valid_targets_mean": 8748.4,
"valid_targets_min": 7035
},
{
"epoch": 1.4411247803163445,
"grad_norm": 0.5065259706681324,
"learning_rate": 3.865985597669478e-05,
"loss": 0.3177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32165688276290894,
"step": 820,
"valid_targets_mean": 8167.2,
"valid_targets_min": 6935
},
{
"epoch": 1.4499121265377855,
"grad_norm": 0.5235301993054804,
"learning_rate": 3.8628129884281034e-05,
"loss": 0.3213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32480478286743164,
"step": 825,
"valid_targets_mean": 7586.2,
"valid_targets_min": 6637
},
{
"epoch": 1.4586994727592266,
"grad_norm": 0.45764897709254765,
"learning_rate": 3.859604596552074e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31234073638916016,
"step": 830,
"valid_targets_mean": 8294.1,
"valid_targets_min": 4643
},
{
"epoch": 1.4674868189806678,
"grad_norm": 0.4819891269065734,
"learning_rate": 3.8563604836711474e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3018292188644409,
"step": 835,
"valid_targets_mean": 7926.1,
"valid_targets_min": 7208
},
{
"epoch": 1.476274165202109,
"grad_norm": 0.4548945218238035,
"learning_rate": 3.8530807121012446e-05,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30471688508987427,
"step": 840,
"valid_targets_mean": 7810.9,
"valid_targets_min": 7383
},
{
"epoch": 1.4850615114235501,
"grad_norm": 0.5069039765101178,
"learning_rate": 3.849765344843251e-05,
"loss": 0.3214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32281768321990967,
"step": 845,
"valid_targets_mean": 7744.0,
"valid_targets_min": 6792
},
{
"epoch": 1.4938488576449913,
"grad_norm": 0.4353328346005066,
"learning_rate": 3.8464144455818065e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31245318055152893,
"step": 850,
"valid_targets_mean": 8749.6,
"valid_targets_min": 6404
},
{
"epoch": 1.5026362038664325,
"grad_norm": 0.5154934910092297,
"learning_rate": 3.8430280786840844e-05,
"loss": 0.3177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3092312216758728,
"step": 855,
"valid_targets_mean": 7474.7,
"valid_targets_min": 6443
},
{
"epoch": 1.5114235500878734,
"grad_norm": 0.4717707322137572,
"learning_rate": 3.83960630919855e-05,
"loss": 0.3216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33252573013305664,
"step": 860,
"valid_targets_mean": 7726.3,
"valid_targets_min": 6303
},
{
"epoch": 1.5202108963093146,
"grad_norm": 0.4285070301543767,
"learning_rate": 3.836149202853718e-05,
"loss": 0.3201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3279268443584442,
"step": 865,
"valid_targets_mean": 7570.2,
"valid_targets_min": 6998
},
{
"epoch": 1.5289982425307556,
"grad_norm": 0.5108276009439777,
"learning_rate": 3.8326568260568835e-05,
"loss": 0.3254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33991026878356934,
"step": 870,
"valid_targets_mean": 7096.4,
"valid_targets_min": 889
},
{
"epoch": 1.5377855887521967,
"grad_norm": 0.5141325486455165,
"learning_rate": 3.82912924589285e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30574706196784973,
"step": 875,
"valid_targets_mean": 7673.6,
"valid_targets_min": 6749
},
{
"epoch": 1.546572934973638,
"grad_norm": 0.47625262382472705,
"learning_rate": 3.825566530122638e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31097936630249023,
"step": 880,
"valid_targets_mean": 7730.6,
"valid_targets_min": 6901
},
{
"epoch": 1.555360281195079,
"grad_norm": 0.5075543716763415,
"learning_rate": 3.8219687471821896e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3260986804962158,
"step": 885,
"valid_targets_mean": 7240.1,
"valid_targets_min": 2559
},
{
"epoch": 1.5641476274165202,
"grad_norm": 0.4684436719897207,
"learning_rate": 3.818335966181045e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3189481496810913,
"step": 890,
"valid_targets_mean": 7754.8,
"valid_targets_min": 6983
},
{
"epoch": 1.5729349736379614,
"grad_norm": 0.4656673097955027,
"learning_rate": 3.814668256901022e-05,
"loss": 0.3143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31112608313560486,
"step": 895,
"valid_targets_mean": 7850.2,
"valid_targets_min": 6723
},
{
"epoch": 1.5817223198594026,
"grad_norm": 0.4384250396130361,
"learning_rate": 3.8109656897948726e-05,
"loss": 0.3175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31039461493492126,
"step": 900,
"valid_targets_mean": 7324.2,
"valid_targets_min": 767
},
{
"epoch": 1.5905096660808435,
"grad_norm": 0.44267159794679833,
"learning_rate": 3.80722833598493e-05,
"loss": 0.3154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3088935613632202,
"step": 905,
"valid_targets_mean": 7892.1,
"valid_targets_min": 6749
},
{
"epoch": 1.5992970123022847,
"grad_norm": 0.47691558808071355,
"learning_rate": 3.803456267261742e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3185274600982666,
"step": 910,
"valid_targets_mean": 7762.7,
"valid_targets_min": 7394
},
{
"epoch": 1.6080843585237259,
"grad_norm": 0.4618900297805469,
"learning_rate": 3.799649556082694e-05,
"loss": 0.3165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30390602350234985,
"step": 915,
"valid_targets_mean": 7575.7,
"valid_targets_min": 6779
},
{
"epoch": 1.6168717047451668,
"grad_norm": 0.48363111062562336,
"learning_rate": 3.7958082755706135e-05,
"loss": 0.3184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3203890323638916,
"step": 920,
"valid_targets_mean": 7784.1,
"valid_targets_min": 6591
},
{
"epoch": 1.625659050966608,
"grad_norm": 0.4401665133027058,
"learning_rate": 3.79193249951237e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.326861172914505,
"step": 925,
"valid_targets_mean": 7839.1,
"valid_targets_min": 7149
},
{
"epoch": 1.6344463971880492,
"grad_norm": 0.4244406950731562,
"learning_rate": 3.788022302357455e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3063619136810303,
"step": 930,
"valid_targets_mean": 8331.9,
"valid_targets_min": 6867
},
{
"epoch": 1.6432337434094904,
"grad_norm": 0.5065832005235931,
"learning_rate": 3.784077759216551e-05,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33527040481567383,
"step": 935,
"valid_targets_mean": 8369.5,
"valid_targets_min": 6595
},
{
"epoch": 1.6520210896309315,
"grad_norm": 0.38976211524282217,
"learning_rate": 3.7800989458600906e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2886279821395874,
"step": 940,
"valid_targets_mean": 7513.3,
"valid_targets_min": 2858
},
{
"epoch": 1.6608084358523727,
"grad_norm": 0.4624244101065446,
"learning_rate": 3.776085938716801e-05,
"loss": 0.3114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3003271222114563,
"step": 945,
"valid_targets_mean": 7507.2,
"valid_targets_min": 6571
},
{
"epoch": 1.6695957820738139,
"grad_norm": 0.49790210807369195,
"learning_rate": 3.7720388148722336e-05,
"loss": 0.3157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3175293803215027,
"step": 950,
"valid_targets_mean": 8316.7,
"valid_targets_min": 6720
},
{
"epoch": 1.6783831282952548,
"grad_norm": 0.440482172085147,
"learning_rate": 3.7679576520672866e-05,
"loss": 0.3053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30894142389297485,
"step": 955,
"valid_targets_mean": 7769.9,
"valid_targets_min": 6443
},
{
"epoch": 1.687170474516696,
"grad_norm": 0.4375270693805628,
"learning_rate": 3.76384252869671e-05,
"loss": 0.3104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30674490332603455,
"step": 960,
"valid_targets_mean": 7664.5,
"valid_targets_min": 6381
},
{
"epoch": 1.695957820738137,
"grad_norm": 0.4268514111495579,
"learning_rate": 3.7596935238076e-05,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31081438064575195,
"step": 965,
"valid_targets_mean": 7781.6,
"valid_targets_min": 7169
},
{
"epoch": 1.7047451669595781,
"grad_norm": 0.41848391215544556,
"learning_rate": 3.755510717097877e-05,
"loss": 0.3217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3070789575576782,
"step": 970,
"valid_targets_mean": 7771.7,
"valid_targets_min": 6903
},
{
"epoch": 1.7135325131810193,
"grad_norm": 0.38149791836038105,
"learning_rate": 3.751294188914763e-05,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30293750762939453,
"step": 975,
"valid_targets_mean": 8644.6,
"valid_targets_min": 6659
},
{
"epoch": 1.7223198594024605,
"grad_norm": 0.4107500940993902,
"learning_rate": 3.74704402025323e-05,
"loss": 0.3188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.320509672164917,
"step": 980,
"valid_targets_mean": 7373.2,
"valid_targets_min": 735
},
{
"epoch": 1.7311072056239016,
"grad_norm": 0.47456518227912814,
"learning_rate": 3.742760292754448e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3110986649990082,
"step": 985,
"valid_targets_mean": 7610.0,
"valid_targets_min": 6580
},
{
"epoch": 1.7398945518453428,
"grad_norm": 0.4804039533298582,
"learning_rate": 3.738443088704217e-05,
"loss": 0.3139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3051522970199585,
"step": 990,
"valid_targets_mean": 7695.4,
"valid_targets_min": 6921
},
{
"epoch": 1.748681898066784,
"grad_norm": 0.413409711024688,
"learning_rate": 3.7340924910313856e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31139689683914185,
"step": 995,
"valid_targets_mean": 8237.9,
"valid_targets_min": 5829
},
{
"epoch": 1.757469244288225,
"grad_norm": 0.48349747289345335,
"learning_rate": 3.7297085833062567e-05,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30862659215927124,
"step": 1000,
"valid_targets_mean": 7671.2,
"valid_targets_min": 6818
},
{
"epoch": 1.766256590509666,
"grad_norm": 0.4556312359385941,
"learning_rate": 3.725291449738984e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3119673728942871,
"step": 1005,
"valid_targets_mean": 7820.5,
"valid_targets_min": 6973
},
{
"epoch": 1.775043936731107,
"grad_norm": 0.4732905673565096,
"learning_rate": 3.720841175177954e-05,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3128761649131775,
"step": 1010,
"valid_targets_mean": 7487.6,
"valid_targets_min": 6949
},
{
"epoch": 1.7838312829525482,
"grad_norm": 0.4360920490955908,
"learning_rate": 3.716357845108157e-05,
"loss": 0.3139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.312790185213089,
"step": 1015,
"valid_targets_mean": 7345.1,
"valid_targets_min": 1033
},
{
"epoch": 1.7926186291739894,
"grad_norm": 0.3929791909563157,
"learning_rate": 3.711841545649543e-05,
"loss": 0.313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3148069977760315,
"step": 1020,
"valid_targets_mean": 8261.2,
"valid_targets_min": 7082
},
{
"epoch": 1.8014059753954306,
"grad_norm": 0.48748675844958406,
"learning_rate": 3.707292363555368e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32383400201797485,
"step": 1025,
"valid_targets_mean": 7643.5,
"valid_targets_min": 6629
},
{
"epoch": 1.8101933216168717,
"grad_norm": 0.41484975733955637,
"learning_rate": 3.702710386210531e-05,
"loss": 0.3104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31957483291625977,
"step": 1030,
"valid_targets_mean": 7626.9,
"valid_targets_min": 6961
},
{
"epoch": 1.818980667838313,
"grad_norm": 0.4464507451663518,
"learning_rate": 3.698095701629888e-05,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.326063334941864,
"step": 1035,
"valid_targets_mean": 8113.2,
"valid_targets_min": 7451
},
{
"epoch": 1.827768014059754,
"grad_norm": 0.45364640899190156,
"learning_rate": 3.6934483984565684e-05,
"loss": 0.3138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3152083158493042,
"step": 1040,
"valid_targets_mean": 8248.0,
"valid_targets_min": 6075
},
{
"epoch": 1.836555360281195,
"grad_norm": 0.42820910363555187,
"learning_rate": 3.688768565960271e-05,
"loss": 0.3142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32458916306495667,
"step": 1045,
"valid_targets_mean": 8503.2,
"valid_targets_min": 7300
},
{
"epoch": 1.8453427065026362,
"grad_norm": 0.43586147124853236,
"learning_rate": 3.6840562940355456e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.304810106754303,
"step": 1050,
"valid_targets_mean": 7810.0,
"valid_targets_min": 6889
},
{
"epoch": 1.8541300527240774,
"grad_norm": 0.428268483581941,
"learning_rate": 3.679311673200069e-05,
"loss": 0.3218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3349687457084656,
"step": 1055,
"valid_targets_mean": 8437.2,
"valid_targets_min": 6462
},
{
"epoch": 1.8629173989455183,
"grad_norm": 0.456980102686238,
"learning_rate": 3.674534794592907e-05,
"loss": 0.3096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3136439919471741,
"step": 1060,
"valid_targets_mean": 7714.3,
"valid_targets_min": 7094
},
{
"epoch": 1.8717047451669595,
"grad_norm": 0.38144903531815577,
"learning_rate": 3.66972574997276e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29975107312202454,
"step": 1065,
"valid_targets_mean": 9710.9,
"valid_targets_min": 7367
},
{
"epoch": 1.8804920913884007,
"grad_norm": 0.43469010555959436,
"learning_rate": 3.664884631716207e-05,
"loss": 0.315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3089476227760315,
"step": 1070,
"valid_targets_mean": 8081.8,
"valid_targets_min": 6677
},
{
"epoch": 1.8892794376098418,
"grad_norm": 0.4334009291737787,
"learning_rate": 3.660011532815923e-05,
"loss": 0.3043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3097480237483978,
"step": 1075,
"valid_targets_mean": 8850.0,
"valid_targets_min": 7388
},
{
"epoch": 1.898066783831283,
"grad_norm": 0.44431763802201296,
"learning_rate": 3.655106546878898e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3016049265861511,
"step": 1080,
"valid_targets_mean": 7862.3,
"valid_targets_min": 7087
},
{
"epoch": 1.9068541300527242,
"grad_norm": 0.41948895342338693,
"learning_rate": 3.6501697681246395e-05,
"loss": 0.3129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30723023414611816,
"step": 1085,
"valid_targets_mean": 7580.1,
"valid_targets_min": 6580
},
{
"epoch": 1.9156414762741654,
"grad_norm": 0.4010740667676957,
"learning_rate": 3.645201291383359e-05,
"loss": 0.3153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.311009019613266,
"step": 1090,
"valid_targets_mean": 7486.8,
"valid_targets_min": 5588
},
{
"epoch": 1.9244288224956063,
"grad_norm": 0.45122299388247816,
"learning_rate": 3.640201212094153e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3017200529575348,
"step": 1095,
"valid_targets_mean": 7640.5,
"valid_targets_min": 6763
},
{
"epoch": 1.9332161687170475,
"grad_norm": 0.48626565470320493,
"learning_rate": 3.635169626303168e-05,
"loss": 0.3096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3185763955116272,
"step": 1100,
"valid_targets_mean": 7626.3,
"valid_targets_min": 6673
},
{
"epoch": 1.9420035149384884,
"grad_norm": 0.4048826995530806,
"learning_rate": 3.630106630661757e-05,
"loss": 0.3171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30462396144866943,
"step": 1105,
"valid_targets_mean": 8426.6,
"valid_targets_min": 6835
},
{
"epoch": 1.9507908611599296,
"grad_norm": 0.416307359936687,
"learning_rate": 3.625012322424623e-05,
"loss": 0.306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30712780356407166,
"step": 1110,
"valid_targets_mean": 8117.8,
"valid_targets_min": 1943
},
{
"epoch": 1.9595782073813708,
"grad_norm": 0.3993336489052123,
"learning_rate": 3.619886799447951e-05,
"loss": 0.3147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3055635690689087,
"step": 1115,
"valid_targets_mean": 8382.2,
"valid_targets_min": 6900
},
{
"epoch": 1.968365553602812,
"grad_norm": 0.42615246784494065,
"learning_rate": 3.6147301601875254e-05,
"loss": 0.3125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3055585026741028,
"step": 1120,
"valid_targets_mean": 8223.8,
"valid_targets_min": 6858
},
{
"epoch": 1.9771528998242531,
"grad_norm": 0.4490236584014622,
"learning_rate": 3.609542503696842e-05,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31063467264175415,
"step": 1125,
"valid_targets_mean": 8464.8,
"valid_targets_min": 5375
},
{
"epoch": 1.9859402460456943,
"grad_norm": 0.42772252919816145,
"learning_rate": 3.6043239296252044e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3156036138534546,
"step": 1130,
"valid_targets_mean": 7510.9,
"valid_targets_min": 6567
},
{
"epoch": 1.9947275922671355,
"grad_norm": 0.39384984278326785,
"learning_rate": 3.59907453821581e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3085365295410156,
"step": 1135,
"valid_targets_mean": 7640.1,
"valid_targets_min": 6847
},
{
"epoch": 2.0035149384885766,
"grad_norm": 0.44225905296388024,
"learning_rate": 3.593794430303824e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31107211112976074,
"step": 1140,
"valid_targets_mean": 7554.0,
"valid_targets_min": 5191
},
{
"epoch": 2.0123022847100174,
"grad_norm": 0.4575942842423528,
"learning_rate": 3.588483707314442e-05,
"loss": 0.3129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3130021095275879,
"step": 1145,
"valid_targets_mean": 8116.2,
"valid_targets_min": 698
},
{
"epoch": 2.0210896309314585,
"grad_norm": 0.5030867471723578,
"learning_rate": 3.583142471260943e-05,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3067258596420288,
"step": 1150,
"valid_targets_mean": 7758.1,
"valid_targets_min": 6711
},
{
"epoch": 2.0298769771528997,
"grad_norm": 0.39211236477001193,
"learning_rate": 3.577770824742728e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2978590726852417,
"step": 1155,
"valid_targets_mean": 7327.9,
"valid_targets_min": 1850
},
{
"epoch": 2.038664323374341,
"grad_norm": 0.45256141444384423,
"learning_rate": 3.5723688709433514e-05,
"loss": 0.3049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29615986347198486,
"step": 1160,
"valid_targets_mean": 7482.5,
"valid_targets_min": 5768
},
{
"epoch": 2.047451669595782,
"grad_norm": 0.46676125736458673,
"learning_rate": 3.566936713628538e-05,
"loss": 0.3094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3241825997829437,
"step": 1165,
"valid_targets_mean": 9016.9,
"valid_targets_min": 6517
},
{
"epoch": 2.0562390158172232,
"grad_norm": 0.4187877737697206,
"learning_rate": 3.561474457144189e-05,
"loss": 0.3177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3071352243423462,
"step": 1170,
"valid_targets_mean": 7480.2,
"valid_targets_min": 4237
},
{
"epoch": 2.0650263620386644,
"grad_norm": 0.3518349882625782,
"learning_rate": 3.55598220641438e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3100239038467407,
"step": 1175,
"valid_targets_mean": 8664.9,
"valid_targets_min": 6995
},
{
"epoch": 2.0738137082601056,
"grad_norm": 0.36943905423071605,
"learning_rate": 3.550460066939339e-05,
"loss": 0.3056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29586344957351685,
"step": 1180,
"valid_targets_mean": 7798.0,
"valid_targets_min": 6979
},
{
"epoch": 2.0826010544815468,
"grad_norm": 0.42787395567576747,
"learning_rate": 3.544908144793431e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3031949996948242,
"step": 1185,
"valid_targets_mean": 7733.5,
"valid_targets_min": 6670
},
{
"epoch": 2.0913884007029875,
"grad_norm": 0.43552604464567035,
"learning_rate": 3.539326546623111e-05,
"loss": 0.3088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30863067507743835,
"step": 1190,
"valid_targets_mean": 7751.4,
"valid_targets_min": 6757
},
{
"epoch": 2.1001757469244287,
"grad_norm": 0.4294105847217134,
"learning_rate": 3.533715379644877e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29311901330947876,
"step": 1195,
"valid_targets_mean": 7684.4,
"valid_targets_min": 7058
},
{
"epoch": 2.10896309314587,
"grad_norm": 0.4207247429632229,
"learning_rate": 3.528074751643215e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2985104024410248,
"step": 1200,
"valid_targets_mean": 7601.2,
"valid_targets_min": 6562
},
{
"epoch": 2.117750439367311,
"grad_norm": 0.3732874962554062,
"learning_rate": 3.5224047709685236e-05,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3063611388206482,
"step": 1205,
"valid_targets_mean": 7761.4,
"valid_targets_min": 7049
},
{
"epoch": 2.126537785588752,
"grad_norm": 0.448230951970861,
"learning_rate": 3.516705546535036e-05,
"loss": 0.3158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3147931694984436,
"step": 1210,
"valid_targets_mean": 7646.8,
"valid_targets_min": 6300
},
{
"epoch": 2.1353251318101933,
"grad_norm": 0.4834980094825441,
"learning_rate": 3.510977187818725e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2965982258319855,
"step": 1215,
"valid_targets_mean": 7572.7,
"valid_targets_min": 6467
},
{
"epoch": 2.1441124780316345,
"grad_norm": 0.3844913906138571,
"learning_rate": 3.5052198048552034e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3124872148036957,
"step": 1220,
"valid_targets_mean": 8456.2,
"valid_targets_min": 7123
},
{
"epoch": 2.1528998242530757,
"grad_norm": 0.4471021182585841,
"learning_rate": 3.499433508237607e-05,
"loss": 0.3078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3014095723628998,
"step": 1225,
"valid_targets_mean": 7605.4,
"valid_targets_min": 6890
},
{
"epoch": 2.161687170474517,
"grad_norm": 0.39860058420156974,
"learning_rate": 3.493618409114473e-05,
"loss": 0.3092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.312033474445343,
"step": 1230,
"valid_targets_mean": 7788.5,
"valid_targets_min": 7179
},
{
"epoch": 2.1704745166959576,
"grad_norm": 0.4467572727911706,
"learning_rate": 3.487774619187603e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30640843510627747,
"step": 1235,
"valid_targets_mean": 7773.8,
"valid_targets_min": 7052
},
{
"epoch": 2.1792618629173988,
"grad_norm": 0.3997396765921527,
"learning_rate": 3.4819022507099184e-05,
"loss": 0.314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31913310289382935,
"step": 1240,
"valid_targets_mean": 8639.9,
"valid_targets_min": 7285
},
{
"epoch": 2.18804920913884,
"grad_norm": 0.4000641776955986,
"learning_rate": 3.476001416483304e-05,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31555551290512085,
"step": 1245,
"valid_targets_mean": 9298.2,
"valid_targets_min": 7236
},
{
"epoch": 2.196836555360281,
"grad_norm": 0.41208383607345306,
"learning_rate": 3.470072229856441e-05,
"loss": 0.3085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31802457571029663,
"step": 1250,
"valid_targets_mean": 8020.3,
"valid_targets_min": 1033
},
{
"epoch": 2.2056239015817223,
"grad_norm": 0.4195318237967421,
"learning_rate": 3.4641148047226296e-05,
"loss": 0.3175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3073643445968628,
"step": 1255,
"valid_targets_mean": 7782.1,
"valid_targets_min": 6665
},
{
"epoch": 2.2144112478031635,
"grad_norm": 0.40213398462418887,
"learning_rate": 3.458129255517601e-05,
"loss": 0.3096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3027478754520416,
"step": 1260,
"valid_targets_mean": 7899.5,
"valid_targets_min": 4269
},
{
"epoch": 2.2231985940246046,
"grad_norm": 0.42889700659379176,
"learning_rate": 3.45211569721732e-05,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3163566589355469,
"step": 1265,
"valid_targets_mean": 7810.5,
"valid_targets_min": 7187
},
{
"epoch": 2.231985940246046,
"grad_norm": 0.46094118123987604,
"learning_rate": 3.446074245335775e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2999768853187561,
"step": 1270,
"valid_targets_mean": 7666.0,
"valid_targets_min": 7186
},
{
"epoch": 2.240773286467487,
"grad_norm": 0.3786878856595145,
"learning_rate": 3.440005015922764e-05,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2929559350013733,
"step": 1275,
"valid_targets_mean": 7560.2,
"valid_targets_min": 6789
},
{
"epoch": 2.249560632688928,
"grad_norm": 0.40495935423491064,
"learning_rate": 3.433908125561655e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30050337314605713,
"step": 1280,
"valid_targets_mean": 8417.1,
"valid_targets_min": 5375
},
{
"epoch": 2.2583479789103693,
"grad_norm": 0.4933512810932113,
"learning_rate": 3.427783691367158e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3097958564758301,
"step": 1285,
"valid_targets_mean": 7632.8,
"valid_targets_min": 6582
},
{
"epoch": 2.26713532513181,
"grad_norm": 0.45052501289258173,
"learning_rate": 3.4216318309830695e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31090953946113586,
"step": 1290,
"valid_targets_mean": 7552.1,
"valid_targets_min": 6602
},
{
"epoch": 2.275922671353251,
"grad_norm": 0.40827626046366344,
"learning_rate": 3.4154526625800136e-05,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.316741943359375,
"step": 1295,
"valid_targets_mean": 8403.2,
"valid_targets_min": 7188
},
{
"epoch": 2.2847100175746924,
"grad_norm": 0.3901372214673228,
"learning_rate": 3.40924630485317e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.291498601436615,
"step": 1300,
"valid_targets_mean": 8731.1,
"valid_targets_min": 6914
},
{
"epoch": 2.2934973637961336,
"grad_norm": 0.4607594936052616,
"learning_rate": 3.4030128770199986e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31470581889152527,
"step": 1305,
"valid_targets_mean": 7488.9,
"valid_targets_min": 6678
},
{
"epoch": 2.3022847100175747,
"grad_norm": 0.4353904042040713,
"learning_rate": 3.3967524988179463e-05,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3008217513561249,
"step": 1310,
"valid_targets_mean": 7801.6,
"valid_targets_min": 7101
},
{
"epoch": 2.311072056239016,
"grad_norm": 0.3982786148979641,
"learning_rate": 3.390465290502146e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3014106750488281,
"step": 1315,
"valid_targets_mean": 8752.8,
"valid_targets_min": 7398
},
{
"epoch": 2.319859402460457,
"grad_norm": 0.3931812519197794,
"learning_rate": 3.3841513728431116e-05,
"loss": 0.3069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3188680410385132,
"step": 1320,
"valid_targets_mean": 8942.9,
"valid_targets_min": 7262
},
{
"epoch": 2.3286467486818982,
"grad_norm": 0.34925229293914345,
"learning_rate": 3.3778108671244117e-05,
"loss": 0.3055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3098894953727722,
"step": 1325,
"valid_targets_mean": 9421.9,
"valid_targets_min": 7103
},
{
"epoch": 2.3374340949033394,
"grad_norm": 0.4079734971148553,
"learning_rate": 3.371443895140343e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31103235483169556,
"step": 1330,
"valid_targets_mean": 7780.8,
"valid_targets_min": 7072
},
{
"epoch": 2.34622144112478,
"grad_norm": 0.4403653941114043,
"learning_rate": 3.365050579193594e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30240386724472046,
"step": 1335,
"valid_targets_mean": 7246.3,
"valid_targets_min": 967
},
{
"epoch": 2.3550087873462213,
"grad_norm": 0.4258857128840449,
"learning_rate": 3.3586310420928884e-05,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3061680793762207,
"step": 1340,
"valid_targets_mean": 7177.9,
"valid_targets_min": 637
},
{
"epoch": 2.3637961335676625,
"grad_norm": 0.39912825352364323,
"learning_rate": 3.352185407150632e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30649226903915405,
"step": 1345,
"valid_targets_mean": 7716.2,
"valid_targets_min": 7084
},
{
"epoch": 2.3725834797891037,
"grad_norm": 0.38375183285614406,
"learning_rate": 3.3457137981805427e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3068873882293701,
"step": 1350,
"valid_targets_mean": 7820.7,
"valid_targets_min": 6638
},
{
"epoch": 2.381370826010545,
"grad_norm": 0.4734888672679818,
"learning_rate": 3.3392163394952694e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2996982932090759,
"step": 1355,
"valid_targets_mean": 7900.8,
"valid_targets_min": 7090
},
{
"epoch": 2.390158172231986,
"grad_norm": 0.4257074824478925,
"learning_rate": 3.3326931559040084e-05,
"loss": 0.3017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3033141493797302,
"step": 1360,
"valid_targets_mean": 8719.5,
"valid_targets_min": 6891
},
{
"epoch": 2.398945518453427,
"grad_norm": 0.3983063674915521,
"learning_rate": 3.326144372710102e-05,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3087483048439026,
"step": 1365,
"valid_targets_mean": 8207.4,
"valid_targets_min": 5826
},
{
"epoch": 2.4077328646748684,
"grad_norm": 0.38937049144098784,
"learning_rate": 3.3195701157086354e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29816991090774536,
"step": 1370,
"valid_targets_mean": 7648.9,
"valid_targets_min": 7040
},
{
"epoch": 2.4165202108963095,
"grad_norm": 0.41374920307885404,
"learning_rate": 3.312970511184017e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29219090938568115,
"step": 1375,
"valid_targets_mean": 7774.8,
"valid_targets_min": 6954
},
{
"epoch": 2.4253075571177503,
"grad_norm": 0.39068918900663724,
"learning_rate": 3.306345685907553e-05,
"loss": 0.3049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.305525004863739,
"step": 1380,
"valid_targets_mean": 7558.7,
"valid_targets_min": 6434
},
{
"epoch": 2.4340949033391914,
"grad_norm": 0.371881435123146,
"learning_rate": 3.299695767135016e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3058660626411438,
"step": 1385,
"valid_targets_mean": 7739.2,
"valid_targets_min": 6924
},
{
"epoch": 2.4428822495606326,
"grad_norm": 0.38458825321625745,
"learning_rate": 3.293020882604194e-05,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30228298902511597,
"step": 1390,
"valid_targets_mean": 8752.3,
"valid_targets_min": 6899
},
{
"epoch": 2.4516695957820738,
"grad_norm": 0.43595201707714715,
"learning_rate": 3.2863211605324416e-05,
"loss": 0.3113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30637264251708984,
"step": 1395,
"valid_targets_mean": 8108.2,
"valid_targets_min": 6679
},
{
"epoch": 2.460456942003515,
"grad_norm": 0.3837177685039735,
"learning_rate": 3.2795967296142185e-05,
"loss": 0.3052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3002673387527466,
"step": 1400,
"valid_targets_mean": 8512.9,
"valid_targets_min": 7227
},
{
"epoch": 2.469244288224956,
"grad_norm": 0.38223835626371655,
"learning_rate": 3.272847719018612e-05,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2972228527069092,
"step": 1405,
"valid_targets_mean": 8684.6,
"valid_targets_min": 7125
},
{
"epoch": 2.4780316344463973,
"grad_norm": 0.3777714976567161,
"learning_rate": 3.2660742583868585e-05,
"loss": 0.3154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3080081045627594,
"step": 1410,
"valid_targets_mean": 8428.3,
"valid_targets_min": 6596
},
{
"epoch": 2.4868189806678385,
"grad_norm": 0.4311154393993648,
"learning_rate": 3.259276477829855e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28569990396499634,
"step": 1415,
"valid_targets_mean": 7225.0,
"valid_targets_min": 791
},
{
"epoch": 2.4956063268892796,
"grad_norm": 0.3830582502669011,
"learning_rate": 3.2524545079256554e-05,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2976120114326477,
"step": 1420,
"valid_targets_mean": 7598.9,
"valid_targets_min": 6837
},
{
"epoch": 2.5043936731107204,
"grad_norm": 0.4094112468037244,
"learning_rate": 3.2456084797169695e-05,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30441173911094666,
"step": 1425,
"valid_targets_mean": 7598.8,
"valid_targets_min": 6490
},
{
"epoch": 2.5131810193321615,
"grad_norm": 0.38103563079986086,
"learning_rate": 3.238738524708636e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29411470890045166,
"step": 1430,
"valid_targets_mean": 8039.4,
"valid_targets_min": 6835
},
{
"epoch": 2.5219683655536027,
"grad_norm": 0.35589307131604775,
"learning_rate": 3.2318447748651054e-05,
"loss": 0.3021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29991233348846436,
"step": 1435,
"valid_targets_mean": 7943.8,
"valid_targets_min": 7488
},
{
"epoch": 2.530755711775044,
"grad_norm": 0.43714729308284495,
"learning_rate": 3.2249273626079005e-05,
"loss": 0.3014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3009275794029236,
"step": 1440,
"valid_targets_mean": 7560.6,
"valid_targets_min": 6313
},
{
"epoch": 2.539543057996485,
"grad_norm": 0.41461305927012404,
"learning_rate": 3.217986420813073e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30489039421081543,
"step": 1445,
"valid_targets_mean": 7940.9,
"valid_targets_min": 7048
},
{
"epoch": 2.5483304042179262,
"grad_norm": 0.39013671195410066,
"learning_rate": 3.211022082808652e-05,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3109816908836365,
"step": 1450,
"valid_targets_mean": 7563.9,
"valid_targets_min": 6580
},
{
"epoch": 2.5571177504393674,
"grad_norm": 0.4147791452090644,
"learning_rate": 3.204034482372081e-05,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3086916506290436,
"step": 1455,
"valid_targets_mean": 7745.0,
"valid_targets_min": 7157
},
{
"epoch": 2.5659050966608086,
"grad_norm": 0.3864245220712862,
"learning_rate": 3.197023753727655e-05,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3015146255493164,
"step": 1460,
"valid_targets_mean": 8278.2,
"valid_targets_min": 6836
},
{
"epoch": 2.5746924428822497,
"grad_norm": 0.3974199065384782,
"learning_rate": 3.18999003154393e-05,
"loss": 0.3083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3117097020149231,
"step": 1465,
"valid_targets_mean": 7764.9,
"valid_targets_min": 6630
},
{
"epoch": 2.5834797891036905,
"grad_norm": 0.4243565407207841,
"learning_rate": 3.1829334509311496e-05,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30094391107559204,
"step": 1470,
"valid_targets_mean": 7812.8,
"valid_targets_min": 6861
},
{
"epoch": 2.5922671353251316,
"grad_norm": 0.40284583779979793,
"learning_rate": 3.175854147438638e-05,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32183435559272766,
"step": 1475,
"valid_targets_mean": 8270.9,
"valid_targets_min": 6766
},
{
"epoch": 2.601054481546573,
"grad_norm": 0.39808650070592766,
"learning_rate": 3.1687522570522055e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3073437213897705,
"step": 1480,
"valid_targets_mean": 7517.8,
"valid_targets_min": 3926
},
{
"epoch": 2.609841827768014,
"grad_norm": 0.4603673602872501,
"learning_rate": 3.1616279161915295e-05,
"loss": 0.3076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31150487065315247,
"step": 1485,
"valid_targets_mean": 7706.1,
"valid_targets_min": 6610
},
{
"epoch": 2.618629173989455,
"grad_norm": 0.38907395491747443,
"learning_rate": 3.1544812617075384e-05,
"loss": 0.3033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30694928765296936,
"step": 1490,
"valid_targets_mean": 7400.9,
"valid_targets_min": 6690
},
{
"epoch": 2.6274165202108963,
"grad_norm": 0.37857824502065196,
"learning_rate": 3.14731243087978e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30862754583358765,
"step": 1495,
"valid_targets_mean": 7636.0,
"valid_targets_min": 6961
},
{
"epoch": 2.6362038664323375,
"grad_norm": 0.37364134233828533,
"learning_rate": 3.140121561413789e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2982473373413086,
"step": 1500,
"valid_targets_mean": 8630.9,
"valid_targets_min": 7356
},
{
"epoch": 2.6449912126537787,
"grad_norm": 0.37894045420149564,
"learning_rate": 3.132908791438434e-05,
"loss": 0.3144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.311771959066391,
"step": 1505,
"valid_targets_mean": 7846.6,
"valid_targets_min": 7249
},
{
"epoch": 2.65377855887522,
"grad_norm": 0.39359306830855695,
"learning_rate": 3.125674259503273e-05,
"loss": 0.3062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3034271001815796,
"step": 1510,
"valid_targets_mean": 7687.1,
"valid_targets_min": 6152
},
{
"epoch": 2.6625659050966606,
"grad_norm": 0.3198160782063454,
"learning_rate": 3.1184181045758854e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2969781160354614,
"step": 1515,
"valid_targets_mean": 8732.8,
"valid_targets_min": 6926
},
{
"epoch": 2.671353251318102,
"grad_norm": 0.43721287392537767,
"learning_rate": 3.111140466039205e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31991803646087646,
"step": 1520,
"valid_targets_mean": 8241.2,
"valid_targets_min": 7027
},
{
"epoch": 2.680140597539543,
"grad_norm": 0.3759484607611042,
"learning_rate": 3.103841483688844e-05,
"loss": 0.3088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31809115409851074,
"step": 1525,
"valid_targets_mean": 7407.9,
"valid_targets_min": 1051
},
{
"epoch": 2.688927943760984,
"grad_norm": 0.38227597925355516,
"learning_rate": 3.096521297730406e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.296236515045166,
"step": 1530,
"valid_targets_mean": 7841.4,
"valid_targets_min": 7067
},
{
"epoch": 2.6977152899824253,
"grad_norm": 0.4440775072110787,
"learning_rate": 3.089180048776792e-05,
"loss": 0.3014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31530511379241943,
"step": 1535,
"valid_targets_mean": 7497.6,
"valid_targets_min": 6947
},
{
"epoch": 2.7065026362038664,
"grad_norm": 0.4044154429897798,
"learning_rate": 3.081817877845502e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.313349187374115,
"step": 1540,
"valid_targets_mean": 7869.1,
"valid_targets_min": 668
},
{
"epoch": 2.7152899824253076,
"grad_norm": 0.35095011195614556,
"learning_rate": 3.074434926355923e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30906468629837036,
"step": 1545,
"valid_targets_mean": 7672.9,
"valid_targets_min": 6969
},
{
"epoch": 2.724077328646749,
"grad_norm": 0.37377485319005543,
"learning_rate": 3.0670313361266165e-05,
"loss": 0.3133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3094746768474579,
"step": 1550,
"valid_targets_mean": 9361.6,
"valid_targets_min": 6725
},
{
"epoch": 2.73286467486819,
"grad_norm": 0.39609784345383675,
"learning_rate": 3.05960724937259e-05,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3020004630088806,
"step": 1555,
"valid_targets_mean": 7593.3,
"valid_targets_min": 6153
},
{
"epoch": 2.7416520210896307,
"grad_norm": 0.39372450689875543,
"learning_rate": 3.0521628087025675e-05,
"loss": 0.3085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30635249614715576,
"step": 1560,
"valid_targets_mean": 7280.9,
"valid_targets_min": 792
},
{
"epoch": 2.7504393673110723,
"grad_norm": 0.4546147869833877,
"learning_rate": 3.04469815711625e-05,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31082868576049805,
"step": 1565,
"valid_targets_mean": 7271.9,
"valid_targets_min": 2103
},
{
"epoch": 2.759226713532513,
"grad_norm": 0.385653663876873,
"learning_rate": 3.037213438001569e-05,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3087978959083557,
"step": 1570,
"valid_targets_mean": 7855.4,
"valid_targets_min": 6830
},
{
"epoch": 2.768014059753954,
"grad_norm": 0.3638152210796052,
"learning_rate": 3.0297087951319315e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2870416045188904,
"step": 1575,
"valid_targets_mean": 8318.2,
"valid_targets_min": 7204
},
{
"epoch": 2.7768014059753954,
"grad_norm": 0.40554492088420635,
"learning_rate": 3.0221843726634587e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3099740445613861,
"step": 1580,
"valid_targets_mean": 7761.8,
"valid_targets_min": 7044
},
{
"epoch": 2.7855887521968365,
"grad_norm": 0.4369178667308916,
"learning_rate": 3.0146403151322156e-05,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3091489374637604,
"step": 1585,
"valid_targets_mean": 7639.2,
"valid_targets_min": 7064
},
{
"epoch": 2.7943760984182777,
"grad_norm": 0.3801491855074197,
"learning_rate": 3.0070767674514355e-05,
"loss": 0.306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32035768032073975,
"step": 1590,
"valid_targets_mean": 7785.9,
"valid_targets_min": 7097
},
{
"epoch": 2.803163444639719,
"grad_norm": 0.3575958406948729,
"learning_rate": 2.999493874908738e-05,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2941886782646179,
"step": 1595,
"valid_targets_mean": 8453.9,
"valid_targets_min": 6573
},
{
"epoch": 2.81195079086116,
"grad_norm": 0.40910005037027813,
"learning_rate": 2.9918917831633362e-05,
"loss": 0.3078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30973154306411743,
"step": 1600,
"valid_targets_mean": 7694.0,
"valid_targets_min": 7177
},
{
"epoch": 2.820738137082601,
"grad_norm": 0.40322666910100285,
"learning_rate": 2.9842706382432375e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2833307385444641,
"step": 1605,
"valid_targets_mean": 7846.4,
"valid_targets_min": 6911
},
{
"epoch": 2.8295254833040424,
"grad_norm": 0.4328858344953751,
"learning_rate": 2.9766305865424435e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29956915974617004,
"step": 1610,
"valid_targets_mean": 7706.2,
"valid_targets_min": 6440
},
{
"epoch": 2.838312829525483,
"grad_norm": 0.3862746865257901,
"learning_rate": 2.9689717748181313e-05,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30747565627098083,
"step": 1615,
"valid_targets_mean": 7839.2,
"valid_targets_min": 6714
},
{
"epoch": 2.8471001757469243,
"grad_norm": 0.35814076275660855,
"learning_rate": 2.9612943501878412e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2956044673919678,
"step": 1620,
"valid_targets_mean": 8089.6,
"valid_targets_min": 6923
},
{
"epoch": 2.8558875219683655,
"grad_norm": 0.3575476615779183,
"learning_rate": 2.953598460126645e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2984451949596405,
"step": 1625,
"valid_targets_mean": 7583.4,
"valid_targets_min": 5811
},
{
"epoch": 2.8646748681898067,
"grad_norm": 0.364251095654717,
"learning_rate": 2.945884252464316e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29613763093948364,
"step": 1630,
"valid_targets_mean": 7839.7,
"valid_targets_min": 7332
},
{
"epoch": 2.873462214411248,
"grad_norm": 0.37913775865436633,
"learning_rate": 2.938151875382489e-05,
"loss": 0.306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3077976107597351,
"step": 1635,
"valid_targets_mean": 7706.9,
"valid_targets_min": 6864
},
{
"epoch": 2.882249560632689,
"grad_norm": 0.3502794052061173,
"learning_rate": 2.9304014774118153e-05,
"loss": 0.2985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29528719186782837,
"step": 1640,
"valid_targets_mean": 9250.9,
"valid_targets_min": 6288
},
{
"epoch": 2.89103690685413,
"grad_norm": 0.40036405725266105,
"learning_rate": 2.922633207429106e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30659887194633484,
"step": 1645,
"valid_targets_mean": 7710.6,
"valid_targets_min": 7033
},
{
"epoch": 2.899824253075571,
"grad_norm": 0.3954524870419218,
"learning_rate": 2.9148472146544757e-05,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2851497232913971,
"step": 1650,
"valid_targets_mean": 7339.9,
"valid_targets_min": 2858
},
{
"epoch": 2.9086115992970125,
"grad_norm": 0.4016749884162129,
"learning_rate": 2.907043648648474e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3091953992843628,
"step": 1655,
"valid_targets_mean": 8124.5,
"valid_targets_min": 7189
},
{
"epoch": 2.9173989455184532,
"grad_norm": 0.34302336945820733,
"learning_rate": 2.8992226593092135e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.290097177028656,
"step": 1660,
"valid_targets_mean": 8428.9,
"valid_targets_min": 6961
},
{
"epoch": 2.9261862917398944,
"grad_norm": 0.3689837782516461,
"learning_rate": 2.8913843968694907e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28554922342300415,
"step": 1665,
"valid_targets_mean": 7704.6,
"valid_targets_min": 6749
},
{
"epoch": 2.9349736379613356,
"grad_norm": 0.3737483155346716,
"learning_rate": 2.8835290118938995e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31530293822288513,
"step": 1670,
"valid_targets_mean": 8266.5,
"valid_targets_min": 5479
},
{
"epoch": 2.9437609841827768,
"grad_norm": 0.37716353251821727,
"learning_rate": 2.8756566552759392e-05,
"loss": 0.2986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30051523447036743,
"step": 1675,
"valid_targets_mean": 8571.9,
"valid_targets_min": 6853
},
{
"epoch": 2.952548330404218,
"grad_norm": 0.3436480692484697,
"learning_rate": 2.8677674782351164e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3064003586769104,
"step": 1680,
"valid_targets_mean": 8446.5,
"valid_targets_min": 6955
},
{
"epoch": 2.961335676625659,
"grad_norm": 0.36327514641467545,
"learning_rate": 2.85986163231404e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.323203444480896,
"step": 1685,
"valid_targets_mean": 8383.3,
"valid_targets_min": 6713
},
{
"epoch": 2.9701230228471003,
"grad_norm": 0.36618297685578105,
"learning_rate": 2.85193926937551e-05,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3078553378582001,
"step": 1690,
"valid_targets_mean": 7677.2,
"valid_targets_min": 6942
},
{
"epoch": 2.9789103690685415,
"grad_norm": 0.4015501740277631,
"learning_rate": 2.8440005415996e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30818092823028564,
"step": 1695,
"valid_targets_mean": 8363.5,
"valid_targets_min": 7110
},
{
"epoch": 2.9876977152899826,
"grad_norm": 0.37457441630305677,
"learning_rate": 2.8360456014807353e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29534947872161865,
"step": 1700,
"valid_targets_mean": 7426.0,
"valid_targets_min": 889
},
{
"epoch": 2.9964850615114234,
"grad_norm": 0.3589323367469997,
"learning_rate": 2.828074601824762e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29085928201675415,
"step": 1705,
"valid_targets_mean": 7558.2,
"valid_targets_min": 6764
},
{
"epoch": 3.0052724077328645,
"grad_norm": 0.3843537170537307,
"learning_rate": 2.820087695746015e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3022106885910034,
"step": 1710,
"valid_targets_mean": 7672.3,
"valid_targets_min": 6491
},
{
"epoch": 3.0140597539543057,
"grad_norm": 0.39461466590743977,
"learning_rate": 2.8120850366643707e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2965931296348572,
"step": 1715,
"valid_targets_mean": 7666.1,
"valid_targets_min": 7020
},
{
"epoch": 3.022847100175747,
"grad_norm": 0.3823839208720008,
"learning_rate": 2.804066778302307e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29734212160110474,
"step": 1720,
"valid_targets_mean": 7955.2,
"valid_targets_min": 6914
},
{
"epoch": 3.031634446397188,
"grad_norm": 0.37794281371658167,
"learning_rate": 2.7960330746819462e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3050759434700012,
"step": 1725,
"valid_targets_mean": 7589.2,
"valid_targets_min": 6396
},
{
"epoch": 3.040421792618629,
"grad_norm": 0.3834396543175821,
"learning_rate": 2.7879840801220967e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29034867882728577,
"step": 1730,
"valid_targets_mean": 7920.9,
"valid_targets_min": 7403
},
{
"epoch": 3.0492091388400704,
"grad_norm": 0.39698828721280216,
"learning_rate": 2.7799199492352893e-05,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2966341972351074,
"step": 1735,
"valid_targets_mean": 7744.3,
"valid_targets_min": 7105
},
{
"epoch": 3.0579964850615116,
"grad_norm": 0.3324961667234077,
"learning_rate": 2.7718408369248093e-05,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2905833125114441,
"step": 1740,
"valid_targets_mean": 7800.8,
"valid_targets_min": 6576
},
{
"epoch": 3.0667838312829527,
"grad_norm": 0.3824356525112284,
"learning_rate": 2.7637468983817167e-05,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2963569462299347,
"step": 1745,
"valid_targets_mean": 7915.6,
"valid_targets_min": 7207
},
{
"epoch": 3.0755711775043935,
"grad_norm": 0.40122996258740906,
"learning_rate": 2.7556382890818682e-05,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2929661273956299,
"step": 1750,
"valid_targets_mean": 7726.7,
"valid_targets_min": 7103
},
{
"epoch": 3.0843585237258346,
"grad_norm": 0.3492966408385829,
"learning_rate": 2.7475151647829314e-05,
"loss": 0.3085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30222034454345703,
"step": 1755,
"valid_targets_mean": 7625.8,
"valid_targets_min": 7081
},
{
"epoch": 3.093145869947276,
"grad_norm": 0.35717867792128094,
"learning_rate": 2.7393776815213903e-05,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30564767122268677,
"step": 1760,
"valid_targets_mean": 8366.2,
"valid_targets_min": 7331
},
{
"epoch": 3.101933216168717,
"grad_norm": 0.3836591053710375,
"learning_rate": 2.731225995609548e-05,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30902570486068726,
"step": 1765,
"valid_targets_mean": 7731.9,
"valid_targets_min": 6950
},
{
"epoch": 3.110720562390158,
"grad_norm": 0.37827048413037573,
"learning_rate": 2.723060263632527e-05,
"loss": 0.2992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3042601943016052,
"step": 1770,
"valid_targets_mean": 7609.2,
"valid_targets_min": 6740
},
{
"epoch": 3.1195079086115993,
"grad_norm": 0.4074776201300159,
"learning_rate": 2.714880642445259e-05,
"loss": 0.3,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30564433336257935,
"step": 1775,
"valid_targets_mean": 7801.8,
"valid_targets_min": 6795
},
{
"epoch": 3.1282952548330405,
"grad_norm": 0.3994404944539335,
"learning_rate": 2.706687289169472e-05,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3061908185482025,
"step": 1780,
"valid_targets_mean": 7779.4,
"valid_targets_min": 7008
},
{
"epoch": 3.1370826010544817,
"grad_norm": 0.36913628829380746,
"learning_rate": 2.698480361190674e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3005139231681824,
"step": 1785,
"valid_targets_mean": 7761.8,
"valid_targets_min": 6357
},
{
"epoch": 3.145869947275923,
"grad_norm": 0.3804227293169359,
"learning_rate": 2.6902600161551273e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2909207046031952,
"step": 1790,
"valid_targets_mean": 7628.8,
"valid_targets_min": 6808
},
{
"epoch": 3.1546572934973636,
"grad_norm": 0.38125704699521695,
"learning_rate": 2.6820264119668215e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2874659299850464,
"step": 1795,
"valid_targets_mean": 7767.1,
"valid_targets_min": 7159
},
{
"epoch": 3.1634446397188047,
"grad_norm": 0.3894373804595348,
"learning_rate": 2.6737797067844403e-05,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2974281907081604,
"step": 1800,
"valid_targets_mean": 7478.9,
"valid_targets_min": 6390
},
{
"epoch": 3.172231985940246,
"grad_norm": 0.4032779429245858,
"learning_rate": 2.6655200590183235e-05,
"loss": 0.3033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894044816493988,
"step": 1805,
"valid_targets_mean": 7810.5,
"valid_targets_min": 6847
},
{
"epoch": 3.181019332161687,
"grad_norm": 0.39036275005771637,
"learning_rate": 2.6572476273274253e-05,
"loss": 0.3017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30358803272247314,
"step": 1810,
"valid_targets_mean": 7659.1,
"valid_targets_min": 6626
},
{
"epoch": 3.1898066783831283,
"grad_norm": 0.4033198742934059,
"learning_rate": 2.6489625706162626e-05,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30405354499816895,
"step": 1815,
"valid_targets_mean": 7780.9,
"valid_targets_min": 6679
},
{
"epoch": 3.1985940246045694,
"grad_norm": 0.3896938362514825,
"learning_rate": 2.6406650480318675e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3113795518875122,
"step": 1820,
"valid_targets_mean": 7647.8,
"valid_targets_min": 7075
},
{
"epoch": 3.2073813708260106,
"grad_norm": 0.3622062948493469,
"learning_rate": 2.6323552189607277e-05,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.306094765663147,
"step": 1825,
"valid_targets_mean": 8025.8,
"valid_targets_min": 6326
},
{
"epoch": 3.2161687170474518,
"grad_norm": 0.4064555280023506,
"learning_rate": 2.6240332430257254e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2962179183959961,
"step": 1830,
"valid_targets_mean": 7738.6,
"valid_targets_min": 7306
},
{
"epoch": 3.224956063268893,
"grad_norm": 0.3633555051355748,
"learning_rate": 2.61569928008307e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3019287884235382,
"step": 1835,
"valid_targets_mean": 8410.9,
"valid_targets_min": 6567
},
{
"epoch": 3.233743409490334,
"grad_norm": 0.40839867807158176,
"learning_rate": 2.6073534902192295e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2952163517475128,
"step": 1840,
"valid_targets_mean": 7896.7,
"valid_targets_min": 7093
},
{
"epoch": 3.242530755711775,
"grad_norm": 0.38608334234814473,
"learning_rate": 2.598996033747855e-05,
"loss": 0.3078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31258517503738403,
"step": 1845,
"valid_targets_mean": 8522.1,
"valid_targets_min": 7245
},
{
"epoch": 3.251318101933216,
"grad_norm": 0.37127080551402336,
"learning_rate": 2.5906270712066972e-05,
"loss": 0.3033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3096095621585846,
"step": 1850,
"valid_targets_mean": 8455.1,
"valid_targets_min": 7211
},
{
"epoch": 3.260105448154657,
"grad_norm": 0.40216557395027774,
"learning_rate": 2.5822467633545305e-05,
"loss": 0.2985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29827120900154114,
"step": 1855,
"valid_targets_mean": 7628.1,
"valid_targets_min": 6542
},
{
"epoch": 3.2688927943760984,
"grad_norm": 0.42644338680649757,
"learning_rate": 2.5738552711680575e-05,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2996917963027954,
"step": 1860,
"valid_targets_mean": 7396.6,
"valid_targets_min": 3281
},
{
"epoch": 3.2776801405975395,
"grad_norm": 0.3822821646569032,
"learning_rate": 2.5654527558388212e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30134713649749756,
"step": 1865,
"valid_targets_mean": 7653.9,
"valid_targets_min": 6719
},
{
"epoch": 3.2864674868189807,
"grad_norm": 0.37847842670001375,
"learning_rate": 2.5570393787701063e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3066447973251343,
"step": 1870,
"valid_targets_mean": 7816.2,
"valid_targets_min": 6870
},
{
"epoch": 3.295254833040422,
"grad_norm": 0.3655419814859327,
"learning_rate": 2.5486153015738412e-05,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3025107979774475,
"step": 1875,
"valid_targets_mean": 9417.5,
"valid_targets_min": 6596
},
{
"epoch": 3.304042179261863,
"grad_norm": 0.35812507396382093,
"learning_rate": 2.5401806860674912e-05,
"loss": 0.2978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30119413137435913,
"step": 1880,
"valid_targets_mean": 8851.4,
"valid_targets_min": 7650
},
{
"epoch": 3.3128295254833042,
"grad_norm": 0.33731159764531526,
"learning_rate": 2.531735694270951e-05,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2901797890663147,
"step": 1885,
"valid_targets_mean": 8558.3,
"valid_targets_min": 7196
},
{
"epoch": 3.3216168717047454,
"grad_norm": 0.35924506975423315,
"learning_rate": 2.5232804884034336e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28924497961997986,
"step": 1890,
"valid_targets_mean": 7621.5,
"valid_targets_min": 5768
},
{
"epoch": 3.330404217926186,
"grad_norm": 0.4077167610712946,
"learning_rate": 2.514815230880353e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894204258918762,
"step": 1895,
"valid_targets_mean": 7784.2,
"valid_targets_min": 7082
},
{
"epoch": 3.3391915641476273,
"grad_norm": 0.40138393301127867,
"learning_rate": 2.506340084310204e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30550941824913025,
"step": 1900,
"valid_targets_mean": 8926.8,
"valid_targets_min": 7692
},
{
"epoch": 3.3479789103690685,
"grad_norm": 0.42423632974581116,
"learning_rate": 2.497855211491441e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2958449423313141,
"step": 1905,
"valid_targets_mean": 7398.2,
"valid_targets_min": 6157
},
{
"epoch": 3.3567662565905096,
"grad_norm": 0.39701449366081437,
"learning_rate": 2.4893607754093467e-05,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3140870928764343,
"step": 1910,
"valid_targets_mean": 7346.4,
"valid_targets_min": 941
},
{
"epoch": 3.365553602811951,
"grad_norm": 0.4032970315145587,
"learning_rate": 2.4808569392329066e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2921169400215149,
"step": 1915,
"valid_targets_mean": 7636.4,
"valid_targets_min": 7047
},
{
"epoch": 3.374340949033392,
"grad_norm": 0.37613825543264184,
"learning_rate": 2.4723438663116692e-05,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2972247004508972,
"step": 1920,
"valid_targets_mean": 7798.5,
"valid_targets_min": 7169
},
{
"epoch": 3.383128295254833,
"grad_norm": 0.3473944568774364,
"learning_rate": 2.4638217201726128e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29673564434051514,
"step": 1925,
"valid_targets_mean": 8248.6,
"valid_targets_min": 7295
},
{
"epoch": 3.3919156414762743,
"grad_norm": 0.37921512732872087,
"learning_rate": 2.4552906645170024e-05,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3123595714569092,
"step": 1930,
"valid_targets_mean": 7522.9,
"valid_targets_min": 6181
},
{
"epoch": 3.4007029876977155,
"grad_norm": 0.4060893190215372,
"learning_rate": 2.4467508632172443e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30219995975494385,
"step": 1935,
"valid_targets_mean": 7820.9,
"valid_targets_min": 7374
},
{
"epoch": 3.4094903339191562,
"grad_norm": 0.38638436375125973,
"learning_rate": 2.4382024803137396e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2929654121398926,
"step": 1940,
"valid_targets_mean": 7747.4,
"valid_targets_min": 6818
},
{
"epoch": 3.4182776801405974,
"grad_norm": 0.3953451484079772,
"learning_rate": 2.429645680011733e-05,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.302202969789505,
"step": 1945,
"valid_targets_mean": 8351.3,
"valid_targets_min": 6862
},
{
"epoch": 3.4270650263620386,
"grad_norm": 0.3751593823197104,
"learning_rate": 2.4210806266781594e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3071412146091461,
"step": 1950,
"valid_targets_mean": 7740.3,
"valid_targets_min": 6935
},
{
"epoch": 3.4358523725834798,
"grad_norm": 0.36196563194913356,
"learning_rate": 2.412507484838482e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2920036315917969,
"step": 1955,
"valid_targets_mean": 7653.2,
"valid_targets_min": 6818
},
{
"epoch": 3.444639718804921,
"grad_norm": 0.37091777373640833,
"learning_rate": 2.4039264191735395e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2962215542793274,
"step": 1960,
"valid_targets_mean": 7831.8,
"valid_targets_min": 6595
},
{
"epoch": 3.453427065026362,
"grad_norm": 0.390591605400152,
"learning_rate": 2.395337594516377e-05,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2922114133834839,
"step": 1965,
"valid_targets_mean": 7379.8,
"valid_targets_min": 697
},
{
"epoch": 3.4622144112478033,
"grad_norm": 0.369413337310835,
"learning_rate": 2.3867411758490816e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2982785403728485,
"step": 1970,
"valid_targets_mean": 7606.5,
"valid_targets_min": 4247
},
{
"epoch": 3.4710017574692444,
"grad_norm": 0.405455002612328,
"learning_rate": 2.378137328299613e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30318358540534973,
"step": 1975,
"valid_targets_mean": 7526.5,
"valid_targets_min": 7074
},
{
"epoch": 3.4797891036906856,
"grad_norm": 0.3634587702657081,
"learning_rate": 2.3695262171386318e-05,
"loss": 0.2978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3018918037414551,
"step": 1980,
"valid_targets_mean": 7679.5,
"valid_targets_min": 6946
},
{
"epoch": 3.4885764499121263,
"grad_norm": 0.34154368112209427,
"learning_rate": 2.3609080077763258e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2998007535934448,
"step": 1985,
"valid_targets_mean": 8390.5,
"valid_targets_min": 7163
},
{
"epoch": 3.4973637961335675,
"grad_norm": 0.3511764990003454,
"learning_rate": 2.3522828657592295e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29999998211860657,
"step": 1990,
"valid_targets_mean": 7749.6,
"valid_targets_min": 6803
},
{
"epoch": 3.5061511423550087,
"grad_norm": 0.34837512795153164,
"learning_rate": 2.3436509567670483e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29551586508750916,
"step": 1995,
"valid_targets_mean": 8445.1,
"valid_targets_min": 6882
},
{
"epoch": 3.51493848857645,
"grad_norm": 0.3593792510717582,
"learning_rate": 2.335012446609473e-05,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29875677824020386,
"step": 2000,
"valid_targets_mean": 7767.0,
"valid_targets_min": 6766
},
{
"epoch": 3.523725834797891,
"grad_norm": 0.34649869648554,
"learning_rate": 2.326367501222996e-05,
"loss": 0.3018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3036854565143585,
"step": 2005,
"valid_targets_mean": 7762.8,
"valid_targets_min": 7027
},
{
"epoch": 3.532513181019332,
"grad_norm": 0.3444149291424148,
"learning_rate": 2.317716286667723e-05,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.285929799079895,
"step": 2010,
"valid_targets_mean": 8649.1,
"valid_targets_min": 7412
},
{
"epoch": 3.5413005272407734,
"grad_norm": 0.3626950990864704,
"learning_rate": 2.3090589691241842e-05,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3122712969779968,
"step": 2015,
"valid_targets_mean": 8208.6,
"valid_targets_min": 7202
},
{
"epoch": 3.5500878734622145,
"grad_norm": 0.40986706588615096,
"learning_rate": 2.300395714890142e-05,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29588234424591064,
"step": 2020,
"valid_targets_mean": 8427.4,
"valid_targets_min": 6603
},
{
"epoch": 3.5588752196836557,
"grad_norm": 0.44018019011979087,
"learning_rate": 2.291726690377394e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2984328866004944,
"step": 2025,
"valid_targets_mean": 7692.3,
"valid_targets_min": 4237
},
{
"epoch": 3.5676625659050965,
"grad_norm": 0.33525487653600955,
"learning_rate": 2.283052062108582e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2910841107368469,
"step": 2030,
"valid_targets_mean": 7992.1,
"valid_targets_min": 843
},
{
"epoch": 3.5764499121265376,
"grad_norm": 0.41470532934154464,
"learning_rate": 2.2743719967139884e-05,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30168616771698,
"step": 2035,
"valid_targets_mean": 7738.9,
"valid_targets_min": 6976
},
{
"epoch": 3.585237258347979,
"grad_norm": 0.3816942129631596,
"learning_rate": 2.265686660928336e-05,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30841612815856934,
"step": 2040,
"valid_targets_mean": 7594.2,
"valid_targets_min": 6528
},
{
"epoch": 3.59402460456942,
"grad_norm": 0.3922269375009551,
"learning_rate": 2.2569962215875866e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2996993064880371,
"step": 2045,
"valid_targets_mean": 7590.4,
"valid_targets_min": 6690
},
{
"epoch": 3.602811950790861,
"grad_norm": 0.3980707323221537,
"learning_rate": 2.248300845625737e-05,
"loss": 0.3002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.303586483001709,
"step": 2050,
"valid_targets_mean": 7318.8,
"valid_targets_min": 735
},
{
"epoch": 3.6115992970123023,
"grad_norm": 0.3961947116955539,
"learning_rate": 2.2396007000716105e-05,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29648107290267944,
"step": 2055,
"valid_targets_mean": 7136.8,
"valid_targets_min": 637
},
{
"epoch": 3.6203866432337435,
"grad_norm": 0.3702084207366189,
"learning_rate": 2.2308959520456485e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2861528992652893,
"step": 2060,
"valid_targets_mean": 7680.1,
"valid_targets_min": 7175
},
{
"epoch": 3.6291739894551847,
"grad_norm": 0.3562202580176658,
"learning_rate": 2.2221867687567012e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2883298993110657,
"step": 2065,
"valid_targets_mean": 7557.6,
"valid_targets_min": 6670
},
{
"epoch": 3.637961335676626,
"grad_norm": 0.34916487177672517,
"learning_rate": 2.2134733174988164e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3074985146522522,
"step": 2070,
"valid_targets_mean": 7415.9,
"valid_targets_min": 5588
},
{
"epoch": 3.6467486818980666,
"grad_norm": 0.328771161047517,
"learning_rate": 2.204755765648024e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930622100830078,
"step": 2075,
"valid_targets_mean": 8362.1,
"valid_targets_min": 6188
},
{
"epoch": 3.655536028119508,
"grad_norm": 0.32265693739853746,
"learning_rate": 2.196034280659122e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2902243733406067,
"step": 2080,
"valid_targets_mean": 8383.9,
"valid_targets_min": 1832
},
{
"epoch": 3.664323374340949,
"grad_norm": 0.34293162883651207,
"learning_rate": 2.187309030062459e-05,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29204216599464417,
"step": 2085,
"valid_targets_mean": 7703.4,
"valid_targets_min": 6982
},
{
"epoch": 3.67311072056239,
"grad_norm": 0.368430645097028,
"learning_rate": 2.17858018146072e-05,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30315840244293213,
"step": 2090,
"valid_targets_mean": 7791.8,
"valid_targets_min": 6947
},
{
"epoch": 3.6818980667838312,
"grad_norm": 0.36604149908644223,
"learning_rate": 2.1698479025256996e-05,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2964887022972107,
"step": 2095,
"valid_targets_mean": 7566.7,
"valid_targets_min": 7005
},
{
"epoch": 3.6906854130052724,
"grad_norm": 0.3479378144053659,
"learning_rate": 2.1611123609950885e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27931052446365356,
"step": 2100,
"valid_targets_mean": 7593.7,
"valid_targets_min": 6713
},
{
"epoch": 3.6994727592267136,
"grad_norm": 0.3561427535078435,
"learning_rate": 2.1523737246692467e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2985917925834656,
"step": 2105,
"valid_targets_mean": 7797.1,
"valid_targets_min": 6688
},
{
"epoch": 3.7082601054481548,
"grad_norm": 0.34500911426625497,
"learning_rate": 2.1436321614079833e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2996689975261688,
"step": 2110,
"valid_targets_mean": 7744.1,
"valid_targets_min": 6637
},
{
"epoch": 3.717047451669596,
"grad_norm": 0.35773921165040784,
"learning_rate": 2.134887839127328e-05,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2833252251148224,
"step": 2115,
"valid_targets_mean": 7583.2,
"valid_targets_min": 6776
},
{
"epoch": 3.7258347978910367,
"grad_norm": 0.3553759973101524,
"learning_rate": 2.1261409257963122e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27806031703948975,
"step": 2120,
"valid_targets_mean": 7864.3,
"valid_targets_min": 6850
},
{
"epoch": 3.7346221441124783,
"grad_norm": 0.34050580593703944,
"learning_rate": 2.1173915894337357e-05,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3134038746356964,
"step": 2125,
"valid_targets_mean": 8492.7,
"valid_targets_min": 685
},
{
"epoch": 3.743409490333919,
"grad_norm": 0.34663435278517646,
"learning_rate": 2.1086399981049422e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2960328757762909,
"step": 2130,
"valid_targets_mean": 8056.3,
"valid_targets_min": 7053
},
{
"epoch": 3.75219683655536,
"grad_norm": 0.3460448048393109,
"learning_rate": 2.0998863199185925e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29417964816093445,
"step": 2135,
"valid_targets_mean": 7704.6,
"valid_targets_min": 6840
},
{
"epoch": 3.7609841827768014,
"grad_norm": 0.3597630093679228,
"learning_rate": 2.0911307230234326e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29962360858917236,
"step": 2140,
"valid_targets_mean": 8447.3,
"valid_targets_min": 7102
},
{
"epoch": 3.7697715289982425,
"grad_norm": 0.3472767049797148,
"learning_rate": 2.0823733756050654e-05,
"loss": 0.2975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2956916093826294,
"step": 2145,
"valid_targets_mean": 8690.3,
"valid_targets_min": 6901
},
{
"epoch": 3.7785588752196837,
"grad_norm": 0.3467387362608841,
"learning_rate": 2.073614445882718e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29842609167099,
"step": 2150,
"valid_targets_mean": 8387.1,
"valid_targets_min": 7325
},
{
"epoch": 3.787346221441125,
"grad_norm": 0.33445920251252786,
"learning_rate": 2.064854102106014e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2935226261615753,
"step": 2155,
"valid_targets_mean": 7921.4,
"valid_targets_min": 5375
},
{
"epoch": 3.796133567662566,
"grad_norm": 0.40128928390340646,
"learning_rate": 2.056092512551738e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3062954843044281,
"step": 2160,
"valid_targets_mean": 7697.6,
"valid_targets_min": 6973
},
{
"epoch": 3.8049209138840068,
"grad_norm": 0.3338208595633261,
"learning_rate": 2.0473298455206057e-05,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3123404383659363,
"step": 2165,
"valid_targets_mean": 10194.6,
"valid_targets_min": 7270
},
{
"epoch": 3.8137082601054484,
"grad_norm": 0.36818192579005726,
"learning_rate": 2.0385662693340286e-05,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.312699556350708,
"step": 2170,
"valid_targets_mean": 8341.1,
"valid_targets_min": 6541
},
{
"epoch": 3.822495606326889,
"grad_norm": 0.38235082701821926,
"learning_rate": 2.0298019523308827e-05,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2968581020832062,
"step": 2175,
"valid_targets_mean": 7806.9,
"valid_targets_min": 6590
},
{
"epoch": 3.8312829525483303,
"grad_norm": 0.35616734722609394,
"learning_rate": 2.0210370628642758e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3092958927154541,
"step": 2180,
"valid_targets_mean": 8949.9,
"valid_targets_min": 6994
},
{
"epoch": 3.8400702987697715,
"grad_norm": 0.36230882317460195,
"learning_rate": 2.0122717692983095e-05,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30545303225517273,
"step": 2185,
"valid_targets_mean": 8836.3,
"valid_targets_min": 7478
},
{
"epoch": 3.8488576449912126,
"grad_norm": 0.369585223854352,
"learning_rate": 2.0035062400048487e-05,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29880499839782715,
"step": 2190,
"valid_targets_mean": 7757.9,
"valid_targets_min": 7021
},
{
"epoch": 3.857644991212654,
"grad_norm": 0.355006341475912,
"learning_rate": 1.9947406433602875e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3043487071990967,
"step": 2195,
"valid_targets_mean": 8424.7,
"valid_targets_min": 7119
},
{
"epoch": 3.866432337434095,
"grad_norm": 0.35860000458499863,
"learning_rate": 1.985975147742313e-05,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29896068572998047,
"step": 2200,
"valid_targets_mean": 7631.4,
"valid_targets_min": 6526
},
{
"epoch": 3.875219683655536,
"grad_norm": 0.3595590287255001,
"learning_rate": 1.9772099215266716e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3074376583099365,
"step": 2205,
"valid_targets_mean": 8199.1,
"valid_targets_min": 6673
},
{
"epoch": 3.884007029876977,
"grad_norm": 0.3337123618202419,
"learning_rate": 1.9684451330839336e-05,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3159179091453552,
"step": 2210,
"valid_targets_mean": 8646.1,
"valid_targets_min": 7196
},
{
"epoch": 3.8927943760984185,
"grad_norm": 0.3375866724477434,
"learning_rate": 1.959680950776262e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30195510387420654,
"step": 2215,
"valid_targets_mean": 8551.9,
"valid_targets_min": 6344
},
{
"epoch": 3.9015817223198592,
"grad_norm": 0.3917560295159304,
"learning_rate": 1.950917542954176e-05,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2983649671077728,
"step": 2220,
"valid_targets_mean": 8389.0,
"valid_targets_min": 6800
},
{
"epoch": 3.9103690685413004,
"grad_norm": 0.32762131645955955,
"learning_rate": 1.9421550779533173e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28323426842689514,
"step": 2225,
"valid_targets_mean": 7616.5,
"valid_targets_min": 7052
},
{
"epoch": 3.9191564147627416,
"grad_norm": 0.3590043216289149,
"learning_rate": 1.933393724091218e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2843273878097534,
"step": 2230,
"valid_targets_mean": 7437.1,
"valid_targets_min": 6760
},
{
"epoch": 3.9279437609841827,
"grad_norm": 0.3377129248179601,
"learning_rate": 1.924633649664065e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3038652539253235,
"step": 2235,
"valid_targets_mean": 7922.2,
"valid_targets_min": 6763
},
{
"epoch": 3.936731107205624,
"grad_norm": 0.3795385389616872,
"learning_rate": 1.9158750229434703e-05,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3075161576271057,
"step": 2240,
"valid_targets_mean": 7685.2,
"valid_targets_min": 6322
},
{
"epoch": 3.945518453427065,
"grad_norm": 0.34801917030646934,
"learning_rate": 1.9071180121732356e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30163663625717163,
"step": 2245,
"valid_targets_mean": 7734.0,
"valid_targets_min": 5781
},
{
"epoch": 3.9543057996485063,
"grad_norm": 0.3710316888949028,
"learning_rate": 1.898362785566122e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2933363914489746,
"step": 2250,
"valid_targets_mean": 7705.3,
"valid_targets_min": 7006
},
{
"epoch": 3.9630931458699474,
"grad_norm": 0.36369463382133627,
"learning_rate": 1.8896095113006203e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2916035056114197,
"step": 2255,
"valid_targets_mean": 7839.6,
"valid_targets_min": 7064
},
{
"epoch": 3.9718804920913886,
"grad_norm": 0.3602525091263,
"learning_rate": 1.8808583575177172e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2959211468696594,
"step": 2260,
"valid_targets_mean": 7561.2,
"valid_targets_min": 6388
},
{
"epoch": 3.9806678383128293,
"grad_norm": 0.3915867253300481,
"learning_rate": 1.8721094923176676e-05,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.294384241104126,
"step": 2265,
"valid_targets_mean": 7656.9,
"valid_targets_min": 7114
},
{
"epoch": 3.9894551845342705,
"grad_norm": 0.33401393363437887,
"learning_rate": 1.863363083756766e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2978602647781372,
"step": 2270,
"valid_targets_mean": 7726.6,
"valid_targets_min": 5183
},
{
"epoch": 3.9982425307557117,
"grad_norm": 0.3565162475058981,
"learning_rate": 1.854619299844117e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30783626437187195,
"step": 2275,
"valid_targets_mean": 7563.9,
"valid_targets_min": 6744
},
{
"epoch": 4.007029876977153,
"grad_norm": 0.3605847836372147,
"learning_rate": 1.845878308538408e-05,
"loss": 0.2945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2928239107131958,
"step": 2280,
"valid_targets_mean": 7678.9,
"valid_targets_min": 6670
},
{
"epoch": 4.015817223198594,
"grad_norm": 0.3622677156022337,
"learning_rate": 1.8371402777446833e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29661375284194946,
"step": 2285,
"valid_targets_mean": 7731.3,
"valid_targets_min": 6753
},
{
"epoch": 4.024604569420035,
"grad_norm": 0.3476786557845217,
"learning_rate": 1.8284053753111205e-05,
"loss": 0.2931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29199156165122986,
"step": 2290,
"valid_targets_mean": 8399.1,
"valid_targets_min": 6665
},
{
"epoch": 4.033391915641476,
"grad_norm": 0.36611453493835344,
"learning_rate": 1.8196737690258034e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2935590147972107,
"step": 2295,
"valid_targets_mean": 7679.2,
"valid_targets_min": 5811
},
{
"epoch": 4.042179261862917,
"grad_norm": 0.3691938793291058,
"learning_rate": 1.810945626613501e-05,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29997485876083374,
"step": 2300,
"valid_targets_mean": 7750.9,
"valid_targets_min": 6803
},
{
"epoch": 4.050966608084359,
"grad_norm": 0.31535572991582766,
"learning_rate": 1.8022211157324446e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30525609850883484,
"step": 2305,
"valid_targets_mean": 9915.7,
"valid_targets_min": 6960
},
{
"epoch": 4.059753954305799,
"grad_norm": 0.312524298994893,
"learning_rate": 1.7935004039711078e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.303733229637146,
"step": 2310,
"valid_targets_mean": 8488.7,
"valid_targets_min": 709
},
{
"epoch": 4.068541300527241,
"grad_norm": 0.3380666197036135,
"learning_rate": 1.7847836588449873e-05,
"loss": 0.2945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29684263467788696,
"step": 2315,
"valid_targets_mean": 7753.6,
"valid_targets_min": 6947
},
{
"epoch": 4.077328646748682,
"grad_norm": 0.3491856380684149,
"learning_rate": 1.7760710477933846e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.296021044254303,
"step": 2320,
"valid_targets_mean": 8416.9,
"valid_targets_min": 6714
},
{
"epoch": 4.086115992970123,
"grad_norm": 0.3377305735422485,
"learning_rate": 1.7673627381761907e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2817150056362152,
"step": 2325,
"valid_targets_mean": 8393.1,
"valid_targets_min": 6642
},
{
"epoch": 4.094903339191564,
"grad_norm": 0.3585848827276999,
"learning_rate": 1.7586588972706703e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930801510810852,
"step": 2330,
"valid_targets_mean": 7160.6,
"valid_targets_min": 787
},
{
"epoch": 4.103690685413005,
"grad_norm": 0.3369104092071973,
"learning_rate": 1.749959692268249e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29731500148773193,
"step": 2335,
"valid_targets_mean": 8363.5,
"valid_targets_min": 6850
},
{
"epoch": 4.1124780316344465,
"grad_norm": 0.3539275994219718,
"learning_rate": 1.741265290271302e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28852784633636475,
"step": 2340,
"valid_targets_mean": 7780.0,
"valid_targets_min": 7083
},
{
"epoch": 4.121265377855887,
"grad_norm": 0.3607445678030254,
"learning_rate": 1.7325758582899442e-05,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3095434010028839,
"step": 2345,
"valid_targets_mean": 7643.3,
"valid_targets_min": 6791
},
{
"epoch": 4.130052724077329,
"grad_norm": 0.3961086551803289,
"learning_rate": 1.7238915632388198e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3048168420791626,
"step": 2350,
"valid_targets_mean": 7675.9,
"valid_targets_min": 6670
},
{
"epoch": 4.1388400702987695,
"grad_norm": 0.3293769346899659,
"learning_rate": 1.7152125719339e-05,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3010752201080322,
"step": 2355,
"valid_targets_mean": 9228.5,
"valid_targets_min": 6075
},
{
"epoch": 4.147627416520211,
"grad_norm": 0.35490134598296946,
"learning_rate": 1.7065390510892767e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.289789080619812,
"step": 2360,
"valid_targets_mean": 7724.8,
"valid_targets_min": 6916
},
{
"epoch": 4.156414762741652,
"grad_norm": 0.35645129004789955,
"learning_rate": 1.69787116731396e-05,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2860274314880371,
"step": 2365,
"valid_targets_mean": 7424.2,
"valid_targets_min": 3281
},
{
"epoch": 4.1652021089630935,
"grad_norm": 0.36641430970748606,
"learning_rate": 1.6892090871086772e-05,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29338160157203674,
"step": 2370,
"valid_targets_mean": 7637.6,
"valid_targets_min": 7054
},
{
"epoch": 4.173989455184534,
"grad_norm": 0.3582363581783471,
"learning_rate": 1.680552976862676e-05,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29446232318878174,
"step": 2375,
"valid_targets_mean": 7540.2,
"valid_targets_min": 6573
},
{
"epoch": 4.182776801405975,
"grad_norm": 0.3343312433323364,
"learning_rate": 1.671903002850528e-05,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29724544286727905,
"step": 2380,
"valid_targets_mean": 7826.4,
"valid_targets_min": 7064
},
{
"epoch": 4.191564147627417,
"grad_norm": 0.34146365708841836,
"learning_rate": 1.6632593312289326e-05,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28881704807281494,
"step": 2385,
"valid_targets_mean": 8713.6,
"valid_targets_min": 7182
},
{
"epoch": 4.200351493848857,
"grad_norm": 0.3793519885366359,
"learning_rate": 1.6546221280335283e-05,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3088436424732208,
"step": 2390,
"valid_targets_mean": 7500.3,
"valid_targets_min": 6973
},
{
"epoch": 4.209138840070299,
"grad_norm": 0.3261860918301623,
"learning_rate": 1.6459915591757026e-05,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2880277633666992,
"step": 2395,
"valid_targets_mean": 8629.6,
"valid_targets_min": 6451
},
{
"epoch": 4.21792618629174,
"grad_norm": 0.33627803896949293,
"learning_rate": 1.6373677904394038e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29634952545166016,
"step": 2400,
"valid_targets_mean": 8985.0,
"valid_targets_min": 6850
},
{
"epoch": 4.226713532513181,
"grad_norm": 0.35027190738818986,
"learning_rate": 1.628750987477957e-05,
"loss": 0.2924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28951579332351685,
"step": 2405,
"valid_targets_mean": 7849.4,
"valid_targets_min": 7153
},
{
"epoch": 4.235500878734622,
"grad_norm": 0.3371494119478246,
"learning_rate": 1.6201413158108823e-05,
"loss": 0.2993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29981040954589844,
"step": 2410,
"valid_targets_mean": 7603.4,
"valid_targets_min": 6746
},
{
"epoch": 4.244288224956064,
"grad_norm": 0.32995317258621537,
"learning_rate": 1.6115389408207168e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2904054522514343,
"step": 2415,
"valid_targets_mean": 8291.9,
"valid_targets_min": 6637
},
{
"epoch": 4.253075571177504,
"grad_norm": 0.3609691770401668,
"learning_rate": 1.6029440277498333e-05,
"loss": 0.2971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2953414022922516,
"step": 2420,
"valid_targets_mean": 7441.1,
"valid_targets_min": 4269
},
{
"epoch": 4.261862917398945,
"grad_norm": 0.34173193821882997,
"learning_rate": 1.594356741697271e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2966964840888977,
"step": 2425,
"valid_targets_mean": 8248.4,
"valid_targets_min": 3803
},
{
"epoch": 4.270650263620387,
"grad_norm": 0.37725438835202146,
"learning_rate": 1.5857772476155634e-05,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29200655221939087,
"step": 2430,
"valid_targets_mean": 7750.5,
"valid_targets_min": 6770
},
{
"epoch": 4.279437609841827,
"grad_norm": 0.3496762203635566,
"learning_rate": 1.577205710307566e-05,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2777150869369507,
"step": 2435,
"valid_targets_mean": 7676.3,
"valid_targets_min": 7223
},
{
"epoch": 4.288224956063269,
"grad_norm": 0.3885029388879682,
"learning_rate": 1.5686422944232952e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29064977169036865,
"step": 2440,
"valid_targets_mean": 7624.4,
"valid_targets_min": 6504
},
{
"epoch": 4.29701230228471,
"grad_norm": 0.34950891257387595,
"learning_rate": 1.5600871644567633e-05,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3030955493450165,
"step": 2445,
"valid_targets_mean": 8336.4,
"valid_targets_min": 7183
},
{
"epoch": 4.305799648506151,
"grad_norm": 0.3758714793081841,
"learning_rate": 1.5515404847428185e-05,
"loss": 0.3043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3020630478858948,
"step": 2450,
"valid_targets_mean": 7686.5,
"valid_targets_min": 6825
},
{
"epoch": 4.314586994727592,
"grad_norm": 0.3640031717897144,
"learning_rate": 1.5430024194539882e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2913421392440796,
"step": 2455,
"valid_targets_mean": 8199.2,
"valid_targets_min": 6796
},
{
"epoch": 4.323374340949034,
"grad_norm": 0.34866882466970534,
"learning_rate": 1.534473132597327e-05,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2923296093940735,
"step": 2460,
"valid_targets_mean": 7538.4,
"valid_targets_min": 6140
},
{
"epoch": 4.3321616871704745,
"grad_norm": 0.33398689156760114,
"learning_rate": 1.5259527880112656e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2966546416282654,
"step": 2465,
"valid_targets_mean": 7731.1,
"valid_targets_min": 6753
},
{
"epoch": 4.340949033391915,
"grad_norm": 0.3911676097472629,
"learning_rate": 1.5174415493624621e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30364346504211426,
"step": 2470,
"valid_targets_mean": 7488.8,
"valid_targets_min": 6749
},
{
"epoch": 4.349736379613357,
"grad_norm": 0.36769878489272523,
"learning_rate": 1.5089395801426596e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28855615854263306,
"step": 2475,
"valid_targets_mean": 7546.9,
"valid_targets_min": 6861
},
{
"epoch": 4.3585237258347975,
"grad_norm": 0.3412416489679569,
"learning_rate": 1.500447043665546e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2983751893043518,
"step": 2480,
"valid_targets_mean": 8474.9,
"valid_targets_min": 5952
},
{
"epoch": 4.367311072056239,
"grad_norm": 0.33005482718780915,
"learning_rate": 1.4919641030636171e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2833927869796753,
"step": 2485,
"valid_targets_mean": 8681.6,
"valid_targets_min": 7316
},
{
"epoch": 4.37609841827768,
"grad_norm": 0.3533106228979608,
"learning_rate": 1.4834909212850393e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28979846835136414,
"step": 2490,
"valid_targets_mean": 7579.9,
"valid_targets_min": 6740
},
{
"epoch": 4.3848857644991215,
"grad_norm": 0.3399076207790794,
"learning_rate": 1.475027661090525e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28529787063598633,
"step": 2495,
"valid_targets_mean": 7799.6,
"valid_targets_min": 7114
},
{
"epoch": 4.393673110720562,
"grad_norm": 0.312265946283216,
"learning_rate": 1.4665744850502035e-05,
"loss": 0.2982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2880713641643524,
"step": 2500,
"valid_targets_mean": 8861.7,
"valid_targets_min": 6847
},
{
"epoch": 4.402460456942004,
"grad_norm": 0.3634215352563139,
"learning_rate": 1.4581315555404975e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29981136322021484,
"step": 2505,
"valid_targets_mean": 7694.9,
"valid_targets_min": 6288
},
{
"epoch": 4.411247803163445,
"grad_norm": 0.33381823311042097,
"learning_rate": 1.4496990347410056e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3036734461784363,
"step": 2510,
"valid_targets_mean": 8840.7,
"valid_targets_min": 7064
},
{
"epoch": 4.420035149384886,
"grad_norm": 0.3609301558527897,
"learning_rate": 1.4412770846313857e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2926355004310608,
"step": 2515,
"valid_targets_mean": 7695.9,
"valid_targets_min": 6847
},
{
"epoch": 4.428822495606327,
"grad_norm": 0.34936926923864897,
"learning_rate": 1.432865866988245e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30009007453918457,
"step": 2520,
"valid_targets_mean": 8763.0,
"valid_targets_min": 7017
},
{
"epoch": 4.437609841827768,
"grad_norm": 0.36541173520341647,
"learning_rate": 1.4244655433820294e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28389137983322144,
"step": 2525,
"valid_targets_mean": 7828.1,
"valid_targets_min": 7234
},
{
"epoch": 4.446397188049209,
"grad_norm": 0.3235817236180097,
"learning_rate": 1.4160762751739245e-05,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28554970026016235,
"step": 2530,
"valid_targets_mean": 8569.7,
"valid_targets_min": 6711
},
{
"epoch": 4.45518453427065,
"grad_norm": 0.37288004350052983,
"learning_rate": 1.4076982235127523e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2974032759666443,
"step": 2535,
"valid_targets_mean": 7637.2,
"valid_targets_min": 6968
},
{
"epoch": 4.463971880492092,
"grad_norm": 0.36992647709739473,
"learning_rate": 1.399331549331878e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29612836241722107,
"step": 2540,
"valid_targets_mean": 7321.6,
"valid_targets_min": 791
},
{
"epoch": 4.472759226713532,
"grad_norm": 0.36203015252759363,
"learning_rate": 1.390976413346116e-05,
"loss": 0.2919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28595858812332153,
"step": 2545,
"valid_targets_mean": 9075.9,
"valid_targets_min": 7270
},
{
"epoch": 4.481546572934974,
"grad_norm": 0.3399703611080894,
"learning_rate": 1.3826329760486462e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2931751608848572,
"step": 2550,
"valid_targets_mean": 7748.2,
"valid_targets_min": 7333
},
{
"epoch": 4.490333919156415,
"grad_norm": 0.3620118102981346,
"learning_rate": 1.3743013977079289e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2936304807662964,
"step": 2555,
"valid_targets_mean": 8341.4,
"valid_targets_min": 6909
},
{
"epoch": 4.499121265377856,
"grad_norm": 0.33151273542929843,
"learning_rate": 1.3659818383646242e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2981259524822235,
"step": 2560,
"valid_targets_mean": 7763.2,
"valid_targets_min": 7005
},
{
"epoch": 4.507908611599297,
"grad_norm": 0.3408783337428309,
"learning_rate": 1.3576744578285235e-05,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30304306745529175,
"step": 2565,
"valid_targets_mean": 7672.8,
"valid_targets_min": 7217
},
{
"epoch": 4.516695957820739,
"grad_norm": 0.34010772862058963,
"learning_rate": 1.3493794156754744e-05,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2977759540081024,
"step": 2570,
"valid_targets_mean": 7593.9,
"valid_targets_min": 6016
},
{
"epoch": 4.525483304042179,
"grad_norm": 0.34600139704727106,
"learning_rate": 1.3410968712443185e-05,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2835003137588501,
"step": 2575,
"valid_targets_mean": 8259.8,
"valid_targets_min": 7135
},
{
"epoch": 4.53427065026362,
"grad_norm": 0.38063980661062224,
"learning_rate": 1.3328269836338285e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2990835905075073,
"step": 2580,
"valid_targets_mean": 7738.0,
"valid_targets_min": 7072
},
{
"epoch": 4.543057996485062,
"grad_norm": 0.3383400317506876,
"learning_rate": 1.3245699116996546e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2957487404346466,
"step": 2585,
"valid_targets_mean": 7810.8,
"valid_targets_min": 7374
},
{
"epoch": 4.551845342706502,
"grad_norm": 0.3411469261818419,
"learning_rate": 1.316325814051271e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2963276505470276,
"step": 2590,
"valid_targets_mean": 8551.5,
"valid_targets_min": 6880
},
{
"epoch": 4.560632688927944,
"grad_norm": 0.36267221964327634,
"learning_rate": 1.3080948490489282e-05,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2887016534805298,
"step": 2595,
"valid_targets_mean": 7742.6,
"valid_targets_min": 6916
},
{
"epoch": 4.569420035149385,
"grad_norm": 0.3192342527402402,
"learning_rate": 1.2998771748006153e-05,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2999793589115143,
"step": 2600,
"valid_targets_mean": 9242.8,
"valid_targets_min": 6875
},
{
"epoch": 4.578207381370826,
"grad_norm": 0.35210138034589905,
"learning_rate": 1.2916729491590191e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29489219188690186,
"step": 2605,
"valid_targets_mean": 7644.7,
"valid_targets_min": 6891
},
{
"epoch": 4.586994727592267,
"grad_norm": 0.35250185727295646,
"learning_rate": 1.2834823297184932e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3076801300048828,
"step": 2610,
"valid_targets_mean": 7650.2,
"valid_targets_min": 6787
},
{
"epoch": 4.595782073813709,
"grad_norm": 0.3588600288438206,
"learning_rate": 1.2753054738120303e-05,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28878769278526306,
"step": 2615,
"valid_targets_mean": 7817.5,
"valid_targets_min": 7146
},
{
"epoch": 4.6045694200351495,
"grad_norm": 0.34081363508124407,
"learning_rate": 1.267142538508241e-05,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2886558771133423,
"step": 2620,
"valid_targets_mean": 7755.6,
"valid_targets_min": 6890
},
{
"epoch": 4.61335676625659,
"grad_norm": 0.3562288164925693,
"learning_rate": 1.258993680608337e-05,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29327595233917236,
"step": 2625,
"valid_targets_mean": 7758.2,
"valid_targets_min": 6882
},
{
"epoch": 4.622144112478032,
"grad_norm": 0.35026490484322587,
"learning_rate": 1.2508590566431149e-05,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29490119218826294,
"step": 2630,
"valid_targets_mean": 7648.2,
"valid_targets_min": 7020
},
{
"epoch": 4.6309314586994725,
"grad_norm": 0.3358053567829388,
"learning_rate": 1.2427388228699561e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2979782223701477,
"step": 2635,
"valid_targets_mean": 7701.8,
"valid_targets_min": 7259
},
{
"epoch": 4.639718804920914,
"grad_norm": 0.34062942673912844,
"learning_rate": 1.2346331352698206e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2931850850582123,
"step": 2640,
"valid_targets_mean": 7778.1,
"valid_targets_min": 6715
},
{
"epoch": 4.648506151142355,
"grad_norm": 0.3432994977430127,
"learning_rate": 1.2265421495442524e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29120543599128723,
"step": 2645,
"valid_targets_mean": 7699.0,
"valid_targets_min": 6975
},
{
"epoch": 4.6572934973637965,
"grad_norm": 0.3234100940050823,
"learning_rate": 1.2184660211123878e-05,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2826187014579773,
"step": 2650,
"valid_targets_mean": 8331.6,
"valid_targets_min": 2881
},
{
"epoch": 4.666080843585237,
"grad_norm": 0.3376680880965843,
"learning_rate": 1.2104049051079706e-05,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29047930240631104,
"step": 2655,
"valid_targets_mean": 7689.2,
"valid_targets_min": 6146
},
{
"epoch": 4.674868189806679,
"grad_norm": 0.33738468635114716,
"learning_rate": 1.2023589563763731e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29389703273773193,
"step": 2660,
"valid_targets_mean": 8689.8,
"valid_targets_min": 7342
},
{
"epoch": 4.68365553602812,
"grad_norm": 0.34363822100044406,
"learning_rate": 1.1943283294716181e-05,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29355084896087646,
"step": 2665,
"valid_targets_mean": 7720.2,
"valid_targets_min": 6622
},
{
"epoch": 4.69244288224956,
"grad_norm": 0.3353093732478869,
"learning_rate": 1.1863131786534146e-05,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2888862192630768,
"step": 2670,
"valid_targets_mean": 7782.6,
"valid_targets_min": 7169
},
{
"epoch": 4.701230228471002,
"grad_norm": 0.37334062851684074,
"learning_rate": 1.1783136578841926e-05,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29228097200393677,
"step": 2675,
"valid_targets_mean": 7612.3,
"valid_targets_min": 6837
},
{
"epoch": 4.710017574692443,
"grad_norm": 0.3310503918639298,
"learning_rate": 1.1703299208261447e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2942769229412079,
"step": 2680,
"valid_targets_mean": 7763.1,
"valid_targets_min": 6840
},
{
"epoch": 4.718804920913884,
"grad_norm": 0.3395372943848242,
"learning_rate": 1.1623621208382759e-05,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2782164514064789,
"step": 2685,
"valid_targets_mean": 7669.9,
"valid_targets_min": 7123
},
{
"epoch": 4.727592267135325,
"grad_norm": 0.3804812360317412,
"learning_rate": 1.1544104109734578e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29553931951522827,
"step": 2690,
"valid_targets_mean": 7181.2,
"valid_targets_min": 919
},
{
"epoch": 4.736379613356767,
"grad_norm": 0.3311195492100797,
"learning_rate": 1.1464749439754872e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2889626622200012,
"step": 2695,
"valid_targets_mean": 7681.3,
"valid_targets_min": 7275
},
{
"epoch": 4.745166959578207,
"grad_norm": 0.36177414094290317,
"learning_rate": 1.1385558722761525e-05,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2815544009208679,
"step": 2700,
"valid_targets_mean": 7833.3,
"valid_targets_min": 6433
},
{
"epoch": 4.753954305799649,
"grad_norm": 0.36212081133708707,
"learning_rate": 1.1306533479923065e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29274970293045044,
"step": 2705,
"valid_targets_mean": 7638.4,
"valid_targets_min": 6999
},
{
"epoch": 4.76274165202109,
"grad_norm": 0.3462449009677967,
"learning_rate": 1.1227675229229453e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29539358615875244,
"step": 2710,
"valid_targets_mean": 7612.1,
"valid_targets_min": 6986
},
{
"epoch": 4.77152899824253,
"grad_norm": 0.3535258801165218,
"learning_rate": 1.1148985485462882e-05,
"loss": 0.2992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30066198110580444,
"step": 2715,
"valid_targets_mean": 8542.9,
"valid_targets_min": 6921
},
{
"epoch": 4.780316344463972,
"grad_norm": 0.3343590007067174,
"learning_rate": 1.1070465760168746e-05,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2772175073623657,
"step": 2720,
"valid_targets_mean": 7717.8,
"valid_targets_min": 6688
},
{
"epoch": 4.789103690685413,
"grad_norm": 0.3298794655275155,
"learning_rate": 1.0992117561626521e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3084215521812439,
"step": 2725,
"valid_targets_mean": 7942.3,
"valid_targets_min": 7273
},
{
"epoch": 4.797891036906854,
"grad_norm": 0.35627041067347104,
"learning_rate": 1.0913942394820882e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3061642646789551,
"step": 2730,
"valid_targets_mean": 8432.6,
"valid_targets_min": 6496
},
{
"epoch": 4.806678383128295,
"grad_norm": 0.3442328956232023,
"learning_rate": 1.0835941761412725e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.299866646528244,
"step": 2735,
"valid_targets_mean": 7752.8,
"valid_targets_min": 6153
},
{
"epoch": 4.815465729349737,
"grad_norm": 0.3253332284940007,
"learning_rate": 1.0758117159710343e-05,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28083181381225586,
"step": 2740,
"valid_targets_mean": 8234.2,
"valid_targets_min": 6249
},
{
"epoch": 4.824253075571177,
"grad_norm": 0.33511730474947343,
"learning_rate": 1.0680470084640682e-05,
"loss": 0.2992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2995944917201996,
"step": 2745,
"valid_targets_mean": 7667.0,
"valid_targets_min": 6791
},
{
"epoch": 4.833040421792619,
"grad_norm": 0.35583495623108913,
"learning_rate": 1.0603002027720544e-05,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29249030351638794,
"step": 2750,
"valid_targets_mean": 7892.6,
"valid_targets_min": 7323
},
{
"epoch": 4.84182776801406,
"grad_norm": 0.32745370080185743,
"learning_rate": 1.0525714477028032e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2977753281593323,
"step": 2755,
"valid_targets_mean": 7558.4,
"valid_targets_min": 6979
},
{
"epoch": 4.8506151142355005,
"grad_norm": 0.3777877026804973,
"learning_rate": 1.044860891717388e-05,
"loss": 0.2902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29842567443847656,
"step": 2760,
"valid_targets_mean": 7716.7,
"valid_targets_min": 7014
},
{
"epoch": 4.859402460456942,
"grad_norm": 0.35088020099221523,
"learning_rate": 1.0371686829273015e-05,
"loss": 0.2931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2985210120677948,
"step": 2765,
"valid_targets_mean": 7565.1,
"valid_targets_min": 6922
},
{
"epoch": 4.868189806678383,
"grad_norm": 0.35904390189923535,
"learning_rate": 1.029494969091601e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2912167012691498,
"step": 2770,
"valid_targets_mean": 7680.2,
"valid_targets_min": 6763
},
{
"epoch": 4.8769771528998245,
"grad_norm": 0.33201225829312675,
"learning_rate": 1.0218398976140809e-05,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27736738324165344,
"step": 2775,
"valid_targets_mean": 7764.4,
"valid_targets_min": 6648
},
{
"epoch": 4.885764499121265,
"grad_norm": 0.35091376493216436,
"learning_rate": 1.0142036155404322e-05,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2956676483154297,
"step": 2780,
"valid_targets_mean": 7626.8,
"valid_targets_min": 6490
},
{
"epoch": 4.894551845342707,
"grad_norm": 0.3452862859027685,
"learning_rate": 1.0065862695554248e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2862079441547394,
"step": 2785,
"valid_targets_mean": 7456.8,
"valid_targets_min": 6528
},
{
"epoch": 4.9033391915641475,
"grad_norm": 0.33774992294028156,
"learning_rate": 9.989880059800832e-06,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29728958010673523,
"step": 2790,
"valid_targets_mean": 7651.0,
"valid_targets_min": 7114
},
{
"epoch": 4.912126537785589,
"grad_norm": 0.317502819584272,
"learning_rate": 9.914089707688835e-06,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.291983962059021,
"step": 2795,
"valid_targets_mean": 8589.1,
"valid_targets_min": 7083
},
{
"epoch": 4.92091388400703,
"grad_norm": 0.3201813183564017,
"learning_rate": 9.838493095069418e-06,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2711242735385895,
"step": 2800,
"valid_targets_mean": 8602.6,
"valid_targets_min": 6905
},
{
"epoch": 4.929701230228471,
"grad_norm": 0.3327302214786523,
"learning_rate": 9.763091674072225e-06,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2929172217845917,
"step": 2805,
"valid_targets_mean": 7599.5,
"valid_targets_min": 6065
},
{
"epoch": 4.938488576449912,
"grad_norm": 0.33452661554480145,
"learning_rate": 9.687886893077498e-06,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3053194284439087,
"step": 2810,
"valid_targets_mean": 7785.0,
"valid_targets_min": 6518
},
{
"epoch": 4.947275922671353,
"grad_norm": 0.35014091058387753,
"learning_rate": 9.612880196688207e-06,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2884902358055115,
"step": 2815,
"valid_targets_mean": 8222.5,
"valid_targets_min": 6895
},
{
"epoch": 4.956063268892795,
"grad_norm": 0.32704238423920323,
"learning_rate": 9.538073025702361e-06,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2998591363430023,
"step": 2820,
"valid_targets_mean": 7775.8,
"valid_targets_min": 6685
},
{
"epoch": 4.964850615114235,
"grad_norm": 0.3298336299808867,
"learning_rate": 9.463466817085268e-06,
"loss": 0.2901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2903066575527191,
"step": 2825,
"valid_targets_mean": 8447.8,
"valid_targets_min": 6800
},
{
"epoch": 4.973637961335677,
"grad_norm": 0.3354261754806601,
"learning_rate": 9.389063003941991e-06,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.288758784532547,
"step": 2830,
"valid_targets_mean": 7734.7,
"valid_targets_min": 6344
},
{
"epoch": 4.982425307557118,
"grad_norm": 0.3143248716857657,
"learning_rate": 9.314863015489781e-06,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.292439728975296,
"step": 2835,
"valid_targets_mean": 8252.8,
"valid_targets_min": 6557
},
{
"epoch": 4.991212653778559,
"grad_norm": 0.350198149823658,
"learning_rate": 9.240868277030637e-06,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28888189792633057,
"step": 2840,
"valid_targets_mean": 7591.3,
"valid_targets_min": 6767
},
{
"epoch": 5.0,
"grad_norm": 0.3433654464608369,
"learning_rate": 9.16708020992392e-06,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28854185342788696,
"step": 2845,
"valid_targets_mean": 7708.3,
"valid_targets_min": 6862
},
{
"epoch": 5.008787346221441,
"grad_norm": 0.35408106613717644,
"learning_rate": 9.093500231559076e-06,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2872666120529175,
"step": 2850,
"valid_targets_mean": 7559.2,
"valid_targets_min": 6375
},
{
"epoch": 5.017574692442882,
"grad_norm": 0.34119774313343076,
"learning_rate": 9.020129755328369e-06,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2759493291378021,
"step": 2855,
"valid_targets_mean": 8318.3,
"valid_targets_min": 6850
},
{
"epoch": 5.026362038664323,
"grad_norm": 0.3390569587906135,
"learning_rate": 8.94697019059977e-06,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29109516739845276,
"step": 2860,
"valid_targets_mean": 7784.2,
"valid_targets_min": 5826
},
{
"epoch": 5.035149384885765,
"grad_norm": 0.3143917948420686,
"learning_rate": 8.874022942689844e-06,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29419422149658203,
"step": 2865,
"valid_targets_mean": 9353.3,
"valid_targets_min": 6895
},
{
"epoch": 5.043936731107205,
"grad_norm": 0.3510435013122092,
"learning_rate": 8.801289412836811e-06,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27901768684387207,
"step": 2870,
"valid_targets_mean": 7662.0,
"valid_targets_min": 6862
},
{
"epoch": 5.052724077328647,
"grad_norm": 0.3664757048422861,
"learning_rate": 8.728770998173567e-06,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3106905221939087,
"step": 2875,
"valid_targets_mean": 8406.5,
"valid_targets_min": 7211
},
{
"epoch": 5.061511423550088,
"grad_norm": 0.34806791171223833,
"learning_rate": 8.656469091700882e-06,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2856566607952118,
"step": 2880,
"valid_targets_mean": 8157.8,
"valid_targets_min": 6785
},
{
"epoch": 5.070298769771529,
"grad_norm": 0.3530629680648787,
"learning_rate": 8.584385082260658e-06,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898819148540497,
"step": 2885,
"valid_targets_mean": 7758.8,
"valid_targets_min": 6637
},
{
"epoch": 5.07908611599297,
"grad_norm": 0.3289134833546327,
"learning_rate": 8.512520354509196e-06,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2844212055206299,
"step": 2890,
"valid_targets_mean": 8317.2,
"valid_targets_min": 6801
},
{
"epoch": 5.087873462214411,
"grad_norm": 0.3228881599417552,
"learning_rate": 8.440876288890663e-06,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3117586374282837,
"step": 2895,
"valid_targets_mean": 8214.1,
"valid_targets_min": 6788
},
{
"epoch": 5.0966608084358525,
"grad_norm": 0.35703463023856147,
"learning_rate": 8.369454261610516e-06,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3001853823661804,
"step": 2900,
"valid_targets_mean": 7620.3,
"valid_targets_min": 6337
},
{
"epoch": 5.105448154657293,
"grad_norm": 0.33663048411660607,
"learning_rate": 8.298255644609132e-06,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2892005443572998,
"step": 2905,
"valid_targets_mean": 8009.3,
"valid_targets_min": 7512
},
{
"epoch": 5.114235500878735,
"grad_norm": 0.35478320721312395,
"learning_rate": 8.227281805535361e-06,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28927919268608093,
"step": 2910,
"valid_targets_mean": 7800.7,
"valid_targets_min": 7136
},
{
"epoch": 5.1230228471001755,
"grad_norm": 0.31733616916369456,
"learning_rate": 8.156534107720362e-06,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2826761305332184,
"step": 2915,
"valid_targets_mean": 8438.5,
"valid_targets_min": 6931
},
{
"epoch": 5.131810193321617,
"grad_norm": 0.3272931666609286,
"learning_rate": 8.086013910151334e-06,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28670844435691833,
"step": 2920,
"valid_targets_mean": 7635.8,
"valid_targets_min": 4770
},
{
"epoch": 5.140597539543058,
"grad_norm": 0.32440078909074577,
"learning_rate": 8.015722567445463e-06,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28524067997932434,
"step": 2925,
"valid_targets_mean": 8409.3,
"valid_targets_min": 6404
},
{
"epoch": 5.1493848857644995,
"grad_norm": 0.32721388026046155,
"learning_rate": 7.94566142982385e-06,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29583433270454407,
"step": 2930,
"valid_targets_mean": 7790.6,
"valid_targets_min": 6812
},
{
"epoch": 5.15817223198594,
"grad_norm": 0.3363730851372013,
"learning_rate": 7.87583184308564e-06,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30835360288619995,
"step": 2935,
"valid_targets_mean": 7662.2,
"valid_targets_min": 7033
},
{
"epoch": 5.166959578207381,
"grad_norm": 0.3376536343834321,
"learning_rate": 7.806235148582102e-06,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28265395760536194,
"step": 2940,
"valid_targets_mean": 7519.6,
"valid_targets_min": 6717
},
{
"epoch": 5.175746924428823,
"grad_norm": 0.33596721819738473,
"learning_rate": 7.736872683190906e-06,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2899321913719177,
"step": 2945,
"valid_targets_mean": 7700.2,
"valid_targets_min": 6626
},
{
"epoch": 5.184534270650263,
"grad_norm": 0.33848326395647726,
"learning_rate": 7.66774577929045e-06,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2899055480957031,
"step": 2950,
"valid_targets_mean": 7385.9,
"valid_targets_min": 6481
},
{
"epoch": 5.193321616871705,
"grad_norm": 0.31778300423572214,
"learning_rate": 7.598855764734217e-06,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29572445154190063,
"step": 2955,
"valid_targets_mean": 8673.2,
"valid_targets_min": 6638
},
{
"epoch": 5.202108963093146,
"grad_norm": 0.36268069305068357,
"learning_rate": 7.530203962825331e-06,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2874404191970825,
"step": 2960,
"valid_targets_mean": 7848.9,
"valid_targets_min": 7071
},
{
"epoch": 5.210896309314587,
"grad_norm": 0.3466580768009033,
"learning_rate": 7.461791692291085e-06,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2909945845603943,
"step": 2965,
"valid_targets_mean": 7791.6,
"valid_targets_min": 6440
},
{
"epoch": 5.219683655536028,
"grad_norm": 0.3547485147268179,
"learning_rate": 7.3936202672576485e-06,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2970777750015259,
"step": 2970,
"valid_targets_mean": 7487.3,
"valid_targets_min": 6296
},
{
"epoch": 5.22847100175747,
"grad_norm": 0.3496834096686977,
"learning_rate": 7.3256909972247994e-06,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2900811433792114,
"step": 2975,
"valid_targets_mean": 7673.6,
"valid_targets_min": 6741
},
{
"epoch": 5.23725834797891,
"grad_norm": 0.35893075162077176,
"learning_rate": 7.258005187040773e-06,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27755802869796753,
"step": 2980,
"valid_targets_mean": 7717.8,
"valid_targets_min": 6803
},
{
"epoch": 5.246045694200351,
"grad_norm": 0.32560513681456177,
"learning_rate": 7.190564136877207e-06,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2886160612106323,
"step": 2985,
"valid_targets_mean": 8614.1,
"valid_targets_min": 7106
},
{
"epoch": 5.254833040421793,
"grad_norm": 0.33155285929884837,
"learning_rate": 7.123369142204175e-06,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29632484912872314,
"step": 2990,
"valid_targets_mean": 8658.5,
"valid_targets_min": 6773
},
{
"epoch": 5.263620386643233,
"grad_norm": 0.32276511243341377,
"learning_rate": 7.0564214937652645e-06,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2822602689266205,
"step": 2995,
"valid_targets_mean": 7759.1,
"valid_targets_min": 6526
},
{
"epoch": 5.272407732864675,
"grad_norm": 0.3225226923127115,
"learning_rate": 6.989722477552836e-06,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2978208661079407,
"step": 3000,
"valid_targets_mean": 8548.8,
"valid_targets_min": 6610
},
{
"epoch": 5.281195079086116,
"grad_norm": 0.3205604405307989,
"learning_rate": 6.923273374783264e-06,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28816479444503784,
"step": 3005,
"valid_targets_mean": 7833.6,
"valid_targets_min": 7200
},
{
"epoch": 5.289982425307557,
"grad_norm": 0.3340979255742489,
"learning_rate": 6.857075461872382e-06,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28635507822036743,
"step": 3010,
"valid_targets_mean": 7720.8,
"valid_targets_min": 6787
},
{
"epoch": 5.298769771528998,
"grad_norm": 0.3298534039786586,
"learning_rate": 6.7911300104109155e-06,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2974523901939392,
"step": 3015,
"valid_targets_mean": 7698.7,
"valid_targets_min": 6677
},
{
"epoch": 5.30755711775044,
"grad_norm": 0.31223988004936154,
"learning_rate": 6.725438287140076e-06,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27365636825561523,
"step": 3020,
"valid_targets_mean": 7658.8,
"valid_targets_min": 7101
},
{
"epoch": 5.31634446397188,
"grad_norm": 0.36712903682229575,
"learning_rate": 6.6600015539272535e-06,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3002887964248657,
"step": 3025,
"valid_targets_mean": 8573.8,
"valid_targets_min": 6856
},
{
"epoch": 5.325131810193321,
"grad_norm": 0.3245992026219487,
"learning_rate": 6.594821067741719e-06,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2914707362651825,
"step": 3030,
"valid_targets_mean": 7622.3,
"valid_targets_min": 6711
},
{
"epoch": 5.333919156414763,
"grad_norm": 0.39660825238437414,
"learning_rate": 6.529898080630552e-06,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2940986752510071,
"step": 3035,
"valid_targets_mean": 7386.1,
"valid_targets_min": 6117
},
{
"epoch": 5.3427065026362035,
"grad_norm": 0.3520229343804998,
"learning_rate": 6.465233839694511e-06,
"loss": 0.288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2902158498764038,
"step": 3040,
"valid_targets_mean": 7599.2,
"valid_targets_min": 6327
},
{
"epoch": 5.351493848857645,
"grad_norm": 0.3448557608828672,
"learning_rate": 6.400829587064163e-06,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28602784872055054,
"step": 3045,
"valid_targets_mean": 7692.1,
"valid_targets_min": 6804
},
{
"epoch": 5.360281195079086,
"grad_norm": 0.32636497092417743,
"learning_rate": 6.3366865598759285e-06,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29605281352996826,
"step": 3050,
"valid_targets_mean": 9081.4,
"valid_targets_min": 6809
},
{
"epoch": 5.3690685413005275,
"grad_norm": 0.3248539671966316,
"learning_rate": 6.272805990248412e-06,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.288605272769928,
"step": 3055,
"valid_targets_mean": 8345.0,
"valid_targets_min": 6517
},
{
"epoch": 5.377855887521968,
"grad_norm": 0.3735371901400926,
"learning_rate": 6.209189105258661e-06,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30450695753097534,
"step": 3060,
"valid_targets_mean": 7874.4,
"valid_targets_min": 6518
},
{
"epoch": 5.38664323374341,
"grad_norm": 0.3163172048772757,
"learning_rate": 6.145837126918652e-06,
"loss": 0.2931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29120033979415894,
"step": 3065,
"valid_targets_mean": 7761.3,
"valid_targets_min": 6781
},
{
"epoch": 5.3954305799648505,
"grad_norm": 0.33063399197041154,
"learning_rate": 6.082751272151759e-06,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2947753071784973,
"step": 3070,
"valid_targets_mean": 8314.8,
"valid_targets_min": 5829
},
{
"epoch": 5.404217926186292,
"grad_norm": 0.31418920675480283,
"learning_rate": 6.019932752769437e-06,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27883777022361755,
"step": 3075,
"valid_targets_mean": 8160.8,
"valid_targets_min": 1058
},
{
"epoch": 5.413005272407733,
"grad_norm": 0.32573627836397306,
"learning_rate": 5.957382775447897e-06,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2857188284397125,
"step": 3080,
"valid_targets_mean": 7901.0,
"valid_targets_min": 7341
},
{
"epoch": 5.421792618629174,
"grad_norm": 0.3271273381515411,
"learning_rate": 5.895102541704944e-06,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29406070709228516,
"step": 3085,
"valid_targets_mean": 8175.0,
"valid_targets_min": 6945
},
{
"epoch": 5.430579964850615,
"grad_norm": 0.3293770941002359,
"learning_rate": 5.833093247876918e-06,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2789419889450073,
"step": 3090,
"valid_targets_mean": 7789.3,
"valid_targets_min": 7058
},
{
"epoch": 5.439367311072056,
"grad_norm": 0.323465702779747,
"learning_rate": 5.771356085095669e-06,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898038923740387,
"step": 3095,
"valid_targets_mean": 7763.9,
"valid_targets_min": 6742
},
{
"epoch": 5.448154657293498,
"grad_norm": 0.32735629336514316,
"learning_rate": 5.709892239265733e-06,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28642818331718445,
"step": 3100,
"valid_targets_mean": 7992.3,
"valid_targets_min": 6744
},
{
"epoch": 5.456942003514938,
"grad_norm": 0.3298517561331294,
"learning_rate": 5.648702891041486e-06,
"loss": 0.289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27885934710502625,
"step": 3105,
"valid_targets_mean": 7718.9,
"valid_targets_min": 6823
},
{
"epoch": 5.46572934973638,
"grad_norm": 0.30381787832315504,
"learning_rate": 5.5877892158045335e-06,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.297435998916626,
"step": 3110,
"valid_targets_mean": 8274.4,
"valid_targets_min": 5183
},
{
"epoch": 5.474516695957821,
"grad_norm": 0.33243040819665437,
"learning_rate": 5.527152383641074e-06,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2871898412704468,
"step": 3115,
"valid_targets_mean": 7849.6,
"valid_targets_min": 7020
},
{
"epoch": 5.483304042179262,
"grad_norm": 0.31558816610328144,
"learning_rate": 5.4667935593194635e-06,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.280933678150177,
"step": 3120,
"valid_targets_mean": 7688.6,
"valid_targets_min": 6730
},
{
"epoch": 5.492091388400703,
"grad_norm": 0.3356246422039742,
"learning_rate": 5.406713902267812e-06,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29142051935195923,
"step": 3125,
"valid_targets_mean": 7132.3,
"valid_targets_min": 722
},
{
"epoch": 5.500878734622145,
"grad_norm": 0.3252334996601614,
"learning_rate": 5.346914566551746e-06,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894833981990814,
"step": 3130,
"valid_targets_mean": 7597.6,
"valid_targets_min": 6517
},
{
"epoch": 5.509666080843585,
"grad_norm": 0.30440359940776446,
"learning_rate": 5.2873967008522006e-06,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2687520980834961,
"step": 3135,
"valid_targets_mean": 8643.2,
"valid_targets_min": 6955
},
{
"epoch": 5.518453427065026,
"grad_norm": 0.33056583512431303,
"learning_rate": 5.228161448443394e-06,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3093627691268921,
"step": 3140,
"valid_targets_mean": 7529.2,
"valid_targets_min": 6591
},
{
"epoch": 5.527240773286468,
"grad_norm": 0.3267302005382248,
"learning_rate": 5.169209947170824e-06,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30785757303237915,
"step": 3145,
"valid_targets_mean": 8656.3,
"valid_targets_min": 6753
},
{
"epoch": 5.536028119507908,
"grad_norm": 0.33200499804961403,
"learning_rate": 5.1105433294294605e-06,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28961071372032166,
"step": 3150,
"valid_targets_mean": 7703.8,
"valid_targets_min": 6934
},
{
"epoch": 5.54481546572935,
"grad_norm": 0.33658932971818206,
"learning_rate": 5.052162722141946e-06,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898900806903839,
"step": 3155,
"valid_targets_mean": 7618.9,
"valid_targets_min": 6719
},
{
"epoch": 5.553602811950791,
"grad_norm": 0.3104483049157492,
"learning_rate": 4.994069246736973e-06,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2733854055404663,
"step": 3160,
"valid_targets_mean": 7678.3,
"valid_targets_min": 6911
},
{
"epoch": 5.562390158172232,
"grad_norm": 0.335513612906866,
"learning_rate": 4.9362640191277526e-06,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28684091567993164,
"step": 3165,
"valid_targets_mean": 7808.9,
"valid_targets_min": 6153
},
{
"epoch": 5.571177504393673,
"grad_norm": 0.3165281390328353,
"learning_rate": 4.878748149690544e-06,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29210197925567627,
"step": 3170,
"valid_targets_mean": 8098.0,
"valid_targets_min": 7111
},
{
"epoch": 5.579964850615115,
"grad_norm": 0.33012053945102526,
"learning_rate": 4.821522743243377e-06,
"loss": 0.2902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29123449325561523,
"step": 3175,
"valid_targets_mean": 7574.3,
"valid_targets_min": 6840
},
{
"epoch": 5.588752196836555,
"grad_norm": 0.31868590805039276,
"learning_rate": 4.764588899024763e-06,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26774659752845764,
"step": 3180,
"valid_targets_mean": 7745.1,
"valid_targets_min": 6969
},
{
"epoch": 5.597539543057996,
"grad_norm": 0.3030971493993999,
"learning_rate": 4.7079477106726576e-06,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2700444459915161,
"step": 3185,
"valid_targets_mean": 8861.1,
"valid_targets_min": 6313
},
{
"epoch": 5.606326889279438,
"grad_norm": 0.31712976658654685,
"learning_rate": 4.6516002662033645e-06,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27993258833885193,
"step": 3190,
"valid_targets_mean": 7806.2,
"valid_targets_min": 6749
},
{
"epoch": 5.6151142355008785,
"grad_norm": 0.3123065680907856,
"learning_rate": 4.595547647990725e-06,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28896477818489075,
"step": 3195,
"valid_targets_mean": 8011.1,
"valid_targets_min": 6719
},
{
"epoch": 5.62390158172232,
"grad_norm": 0.32853539593068376,
"learning_rate": 4.53979093274526e-06,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29997682571411133,
"step": 3200,
"valid_targets_mean": 8496.4,
"valid_targets_min": 6859
},
{
"epoch": 5.632688927943761,
"grad_norm": 0.341458589626131,
"learning_rate": 4.484331191493532e-06,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28483325242996216,
"step": 3205,
"valid_targets_mean": 8154.6,
"valid_targets_min": 7068
},
{
"epoch": 5.6414762741652025,
"grad_norm": 0.31495834405447776,
"learning_rate": 4.429169489557528e-06,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2851713001728058,
"step": 3210,
"valid_targets_mean": 7686.2,
"valid_targets_min": 6387
},
{
"epoch": 5.650263620386643,
"grad_norm": 0.29999185071692785,
"learning_rate": 4.374306886534248e-06,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28340470790863037,
"step": 3215,
"valid_targets_mean": 8562.3,
"valid_targets_min": 6326
},
{
"epoch": 5.659050966608085,
"grad_norm": 0.3231664440148963,
"learning_rate": 4.3197444362752994e-06,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2838216722011566,
"step": 3220,
"valid_targets_mean": 7336.6,
"valid_targets_min": 709
},
{
"epoch": 5.6678383128295255,
"grad_norm": 0.30672227936405144,
"learning_rate": 4.265483186866688e-06,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2630815804004669,
"step": 3225,
"valid_targets_mean": 8641.6,
"valid_targets_min": 6861
},
{
"epoch": 5.676625659050966,
"grad_norm": 0.3377876014310014,
"learning_rate": 4.211524180608672e-06,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2870168685913086,
"step": 3230,
"valid_targets_mean": 7735.8,
"valid_targets_min": 6915
},
{
"epoch": 5.685413005272408,
"grad_norm": 0.31001235576301167,
"learning_rate": 4.157868453995757e-06,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28175193071365356,
"step": 3235,
"valid_targets_mean": 8350.0,
"valid_targets_min": 6625
},
{
"epoch": 5.694200351493849,
"grad_norm": 0.31083908749481165,
"learning_rate": 4.104517037696749e-06,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27868616580963135,
"step": 3240,
"valid_targets_mean": 8633.8,
"valid_targets_min": 7194
},
{
"epoch": 5.70298769771529,
"grad_norm": 0.32191431288817535,
"learning_rate": 4.051470956535004e-06,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29141765832901,
"step": 3245,
"valid_targets_mean": 7639.6,
"valid_targets_min": 6344
},
{
"epoch": 5.711775043936731,
"grad_norm": 0.3396193057167186,
"learning_rate": 3.998731229468697e-06,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2942695915699005,
"step": 3250,
"valid_targets_mean": 7783.9,
"valid_targets_min": 7334
},
{
"epoch": 5.720562390158173,
"grad_norm": 0.3092604067668136,
"learning_rate": 3.94629886957129e-06,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28806155920028687,
"step": 3255,
"valid_targets_mean": 7493.6,
"valid_targets_min": 5869
},
{
"epoch": 5.729349736379613,
"grad_norm": 0.3292858311037341,
"learning_rate": 3.8941748840120404e-06,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.290735125541687,
"step": 3260,
"valid_targets_mean": 7823.6,
"valid_targets_min": 7275
},
{
"epoch": 5.738137082601055,
"grad_norm": 0.32174230635297546,
"learning_rate": 3.842360274036658e-06,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30042213201522827,
"step": 3265,
"valid_targets_mean": 7548.5,
"valid_targets_min": 6556
},
{
"epoch": 5.746924428822496,
"grad_norm": 0.3150931499885214,
"learning_rate": 3.7908560349481072e-06,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.296764612197876,
"step": 3270,
"valid_targets_mean": 8671.5,
"valid_targets_min": 6838
},
{
"epoch": 5.755711775043936,
"grad_norm": 0.3251774095699638,
"learning_rate": 3.7396631560874296e-06,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2913369834423065,
"step": 3275,
"valid_targets_mean": 7595.5,
"valid_targets_min": 4779
},
{
"epoch": 5.764499121265378,
"grad_norm": 0.29806093139480805,
"learning_rate": 3.6887826208147968e-06,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2796759605407715,
"step": 3280,
"valid_targets_mean": 8333.2,
"valid_targets_min": 6872
},
{
"epoch": 5.773286467486819,
"grad_norm": 0.32196531471289125,
"learning_rate": 3.6382154064905794e-06,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2924780547618866,
"step": 3285,
"valid_targets_mean": 7810.5,
"valid_targets_min": 6153
},
{
"epoch": 5.78207381370826,
"grad_norm": 0.31002178625719085,
"learning_rate": 3.587962484456611e-06,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2780643403530121,
"step": 3290,
"valid_targets_mean": 7344.2,
"valid_targets_min": 889
},
{
"epoch": 5.790861159929701,
"grad_norm": 0.3337355043722275,
"learning_rate": 3.538024820017467e-06,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.294627845287323,
"step": 3295,
"valid_targets_mean": 8312.8,
"valid_targets_min": 7030
},
{
"epoch": 5.799648506151143,
"grad_norm": 0.312698283528566,
"learning_rate": 3.488403372422011e-06,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2884920835494995,
"step": 3300,
"valid_targets_mean": 8300.7,
"valid_targets_min": 6396
},
{
"epoch": 5.808435852372583,
"grad_norm": 0.3091039350887255,
"learning_rate": 3.4390990948448867e-06,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2812803387641907,
"step": 3305,
"valid_targets_mean": 8493.2,
"valid_targets_min": 6773
},
{
"epoch": 5.817223198594025,
"grad_norm": 0.31877137936357625,
"learning_rate": 3.390112934368266e-06,
"loss": 0.2909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27986976504325867,
"step": 3310,
"valid_targets_mean": 7588.8,
"valid_targets_min": 6270
},
{
"epoch": 5.826010544815466,
"grad_norm": 0.3171231931848898,
"learning_rate": 3.3414458319636124e-06,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28334343433380127,
"step": 3315,
"valid_targets_mean": 7865.8,
"valid_targets_min": 7421
},
{
"epoch": 5.8347978910369065,
"grad_norm": 0.351307724929885,
"learning_rate": 3.2930987224736465e-06,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3002662658691406,
"step": 3320,
"valid_targets_mean": 6947.4,
"valid_targets_min": 2881
},
{
"epoch": 5.843585237258348,
"grad_norm": 0.33358711919009776,
"learning_rate": 3.2450725345943577e-06,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27923858165740967,
"step": 3325,
"valid_targets_mean": 7789.2,
"valid_targets_min": 6921
},
{
"epoch": 5.852372583479789,
"grad_norm": 0.3414208492312931,
"learning_rate": 3.197368190857173e-06,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2987247705459595,
"step": 3330,
"valid_targets_mean": 7808.4,
"valid_targets_min": 6834
},
{
"epoch": 5.8611599297012305,
"grad_norm": 0.3348762946692922,
"learning_rate": 3.149986607611253e-06,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2956831455230713,
"step": 3335,
"valid_targets_mean": 7496.1,
"valid_targets_min": 6456
},
{
"epoch": 5.869947275922671,
"grad_norm": 0.3448410739256257,
"learning_rate": 3.102928695005858e-06,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2887445390224457,
"step": 3340,
"valid_targets_mean": 7771.7,
"valid_targets_min": 7171
},
{
"epoch": 5.878734622144113,
"grad_norm": 0.3043444067789503,
"learning_rate": 3.0561953569729064e-06,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28372079133987427,
"step": 3345,
"valid_targets_mean": 7517.8,
"valid_targets_min": 6720
},
{
"epoch": 5.8875219683655535,
"grad_norm": 0.3164874212248818,
"learning_rate": 3.0097874912095636e-06,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29748934507369995,
"step": 3350,
"valid_targets_mean": 8516.9,
"valid_targets_min": 7389
},
{
"epoch": 5.896309314586995,
"grad_norm": 0.32852926202032856,
"learning_rate": 2.9637059891610452e-06,
"loss": 0.297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930929660797119,
"step": 3355,
"valid_targets_mean": 7919.1,
"valid_targets_min": 7175
},
{
"epoch": 5.905096660808436,
"grad_norm": 0.9335255021053942,
"learning_rate": 2.9179517360034526e-06,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28942394256591797,
"step": 3360,
"valid_targets_mean": 7831.2,
"valid_targets_min": 5375
},
{
"epoch": 5.913884007029877,
"grad_norm": 0.33951614009792314,
"learning_rate": 2.872525610626797e-06,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3013302981853485,
"step": 3365,
"valid_targets_mean": 8491.2,
"valid_targets_min": 7200
},
{
"epoch": 5.922671353251318,
"grad_norm": 0.31883626036243257,
"learning_rate": 2.827428485618102e-06,
"loss": 0.295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28803277015686035,
"step": 3370,
"valid_targets_mean": 8212.4,
"valid_targets_min": 5811
},
{
"epoch": 5.931458699472759,
"grad_norm": 0.2878749967770179,
"learning_rate": 2.7826612272446584e-06,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2861100137233734,
"step": 3375,
"valid_targets_mean": 8553.2,
"valid_targets_min": 6438
},
{
"epoch": 5.940246045694201,
"grad_norm": 0.2985617783397011,
"learning_rate": 2.738224695437357e-06,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2832047641277313,
"step": 3380,
"valid_targets_mean": 8549.3,
"valid_targets_min": 7163
},
{
"epoch": 5.949033391915641,
"grad_norm": 0.32595062411682413,
"learning_rate": 2.6941197437742105e-06,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29271990060806274,
"step": 3385,
"valid_targets_mean": 7661.8,
"valid_targets_min": 6983
},
{
"epoch": 5.957820738137083,
"grad_norm": 0.31020871319992316,
"learning_rate": 2.650347219463907e-06,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28285855054855347,
"step": 3390,
"valid_targets_mean": 8599.2,
"valid_targets_min": 7033
},
{
"epoch": 5.966608084358524,
"grad_norm": 0.31645890810904653,
"learning_rate": 2.6069079633295858e-06,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930651903152466,
"step": 3395,
"valid_targets_mean": 7556.0,
"valid_targets_min": 6435
},
{
"epoch": 5.975395430579965,
"grad_norm": 0.3164728752307686,
"learning_rate": 2.563802809792646e-06,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29243242740631104,
"step": 3400,
"valid_targets_mean": 7732.3,
"valid_targets_min": 6723
},
{
"epoch": 5.984182776801406,
"grad_norm": 0.3400353139390024,
"learning_rate": 2.52103258685674e-06,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30362796783447266,
"step": 3405,
"valid_targets_mean": 7429.9,
"valid_targets_min": 941
},
{
"epoch": 5.992970123022847,
"grad_norm": 0.3333200137211664,
"learning_rate": 2.4785981160918703e-06,
"loss": 0.2847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2824479937553406,
"step": 3410,
"valid_targets_mean": 7657.1,
"valid_targets_min": 7075
},
{
"epoch": 6.001757469244288,
"grad_norm": 0.3095648198654591,
"learning_rate": 2.436500212618589e-06,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2807752192020416,
"step": 3415,
"valid_targets_mean": 7814.2,
"valid_targets_min": 6749
},
{
"epoch": 6.010544815465729,
"grad_norm": 0.3075173199504854,
"learning_rate": 2.3947396850923664e-06,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2928026616573334,
"step": 3420,
"valid_targets_mean": 7933.4,
"valid_targets_min": 7239
},
{
"epoch": 6.019332161687171,
"grad_norm": 0.299535909340376,
"learning_rate": 2.35331733568803e-06,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.292161762714386,
"step": 3425,
"valid_targets_mean": 8519.8,
"valid_targets_min": 6248
},
{
"epoch": 6.028119507908611,
"grad_norm": 0.32022750824787705,
"learning_rate": 2.312233960084389e-06,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2915361225605011,
"step": 3430,
"valid_targets_mean": 7603.8,
"valid_targets_min": 6706
},
{
"epoch": 6.036906854130053,
"grad_norm": 0.33443315293974885,
"learning_rate": 2.271490347448895e-06,
"loss": 0.289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2938150465488434,
"step": 3435,
"valid_targets_mean": 7733.7,
"valid_targets_min": 7175
},
{
"epoch": 6.045694200351494,
"grad_norm": 0.3258133355986156,
"learning_rate": 2.231087280422557e-06,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28791695833206177,
"step": 3440,
"valid_targets_mean": 7775.0,
"valid_targets_min": 7127
},
{
"epoch": 6.054481546572935,
"grad_norm": 0.3422113528790867,
"learning_rate": 2.1910255351048426e-06,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2992529273033142,
"step": 3445,
"valid_targets_mean": 7713.1,
"valid_targets_min": 6958
},
{
"epoch": 6.063268892794376,
"grad_norm": 0.33857272608122346,
"learning_rate": 2.151305881038814e-06,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28023239970207214,
"step": 3450,
"valid_targets_mean": 7220.9,
"valid_targets_min": 1058
},
{
"epoch": 6.072056239015817,
"grad_norm": 0.3093639323935716,
"learning_rate": 2.1119290811963134e-06,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2893432378768921,
"step": 3455,
"valid_targets_mean": 7880.4,
"valid_targets_min": 6603
},
{
"epoch": 6.080843585237258,
"grad_norm": 0.30417854651758086,
"learning_rate": 2.0728958919633337e-06,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2948586642742157,
"step": 3460,
"valid_targets_mean": 7946.2,
"valid_targets_min": 7028
},
{
"epoch": 6.089630931458699,
"grad_norm": 0.3131048355787601,
"learning_rate": 2.034207063125473e-06,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28712961077690125,
"step": 3465,
"valid_targets_mean": 7673.6,
"valid_targets_min": 6837
},
{
"epoch": 6.098418277680141,
"grad_norm": 0.44135555559021356,
"learning_rate": 1.9958633378535277e-06,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27640682458877563,
"step": 3470,
"valid_targets_mean": 8458.7,
"valid_targets_min": 6296
},
{
"epoch": 6.1072056239015815,
"grad_norm": 0.3231106733854511,
"learning_rate": 1.9578654526892425e-06,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28280821442604065,
"step": 3475,
"valid_targets_mean": 7895.6,
"valid_targets_min": 7455
},
{
"epoch": 6.115992970123023,
"grad_norm": 0.308903440119535,
"learning_rate": 1.9202141375311335e-06,
"loss": 0.2862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2916829288005829,
"step": 3480,
"valid_targets_mean": 7596.1,
"valid_targets_min": 6547
},
{
"epoch": 6.124780316344464,
"grad_norm": 0.32006985936416427,
"learning_rate": 1.8829101156204844e-06,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3005526065826416,
"step": 3485,
"valid_targets_mean": 7917.9,
"valid_targets_min": 6744
},
{
"epoch": 6.1335676625659055,
"grad_norm": 0.3266735247756828,
"learning_rate": 1.8459541035274453e-06,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2887221574783325,
"step": 3490,
"valid_targets_mean": 7609.4,
"valid_targets_min": 6882
},
{
"epoch": 6.142355008787346,
"grad_norm": 0.3030295623224466,
"learning_rate": 1.8093468111372802e-06,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28173595666885376,
"step": 3495,
"valid_targets_mean": 7799.6,
"valid_targets_min": 6645
},
{
"epoch": 6.151142355008787,
"grad_norm": 0.3211889651008717,
"learning_rate": 1.7730889416367115e-06,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2866337299346924,
"step": 3500,
"valid_targets_mean": 7365.6,
"valid_targets_min": 685
},
{
"epoch": 6.1599297012302285,
"grad_norm": 0.31769129512356303,
"learning_rate": 1.73718119150043e-06,
"loss": 0.288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2844308614730835,
"step": 3505,
"valid_targets_mean": 7739.8,
"valid_targets_min": 7015
},
{
"epoch": 6.168717047451669,
"grad_norm": 0.2887437522654917,
"learning_rate": 1.7016242504777048e-06,
"loss": 0.2871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2782225012779236,
"step": 3510,
"valid_targets_mean": 8382.1,
"valid_targets_min": 6670
},
{
"epoch": 6.177504393673111,
"grad_norm": 0.3196770566443562,
"learning_rate": 1.6664188015791484e-06,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2772035002708435,
"step": 3515,
"valid_targets_mean": 7498.5,
"valid_targets_min": 4799
},
{
"epoch": 6.186291739894552,
"grad_norm": 0.2886453087922719,
"learning_rate": 1.6315655210635784e-06,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28373849391937256,
"step": 3520,
"valid_targets_mean": 9234.0,
"valid_targets_min": 6924
},
{
"epoch": 6.195079086115993,
"grad_norm": 0.31452567443023266,
"learning_rate": 1.5970650784250442e-06,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3046089708805084,
"step": 3525,
"valid_targets_mean": 7534.6,
"valid_targets_min": 6593
},
{
"epoch": 6.203866432337434,
"grad_norm": 0.33171229659648493,
"learning_rate": 1.5629181363799517e-06,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.304110050201416,
"step": 3530,
"valid_targets_mean": 7414.1,
"valid_targets_min": 4643
},
{
"epoch": 6.212653778558876,
"grad_norm": 0.3241057334603984,
"learning_rate": 1.5291253508543458e-06,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2967751622200012,
"step": 3535,
"valid_targets_mean": 7636.1,
"valid_targets_min": 6327
},
{
"epoch": 6.221441124780316,
"grad_norm": 0.29597922977914076,
"learning_rate": 1.4956873709713016e-06,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2816871106624603,
"step": 3540,
"valid_targets_mean": 8233.2,
"valid_targets_min": 6758
},
{
"epoch": 6.230228471001757,
"grad_norm": 0.32662913224841694,
"learning_rate": 1.4626048390384573e-06,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29462772607803345,
"step": 3545,
"valid_targets_mean": 7599.8,
"valid_targets_min": 6835
},
{
"epoch": 6.239015817223199,
"grad_norm": 0.28643663955838083,
"learning_rate": 1.4298783905356906e-06,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2688906192779541,
"step": 3550,
"valid_targets_mean": 8510.6,
"valid_targets_min": 7169
},
{
"epoch": 6.247803163444639,
"grad_norm": 0.31827582182584874,
"learning_rate": 1.3975086541028815e-06,
"loss": 0.2919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28534990549087524,
"step": 3555,
"valid_targets_mean": 7687.6,
"valid_targets_min": 6288
},
{
"epoch": 6.256590509666081,
"grad_norm": 0.2991456687508091,
"learning_rate": 1.3654962515278692e-06,
"loss": 0.2881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2955605089664459,
"step": 3560,
"valid_targets_mean": 8628.6,
"valid_targets_min": 7094
},
{
"epoch": 6.265377855887522,
"grad_norm": 0.3319859213632947,
"learning_rate": 1.3338417977344853e-06,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28525975346565247,
"step": 3565,
"valid_targets_mean": 7747.8,
"valid_targets_min": 6890
},
{
"epoch": 6.274165202108963,
"grad_norm": 0.32759436127422603,
"learning_rate": 1.302545900770762e-06,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28943735361099243,
"step": 3570,
"valid_targets_mean": 8275.8,
"valid_targets_min": 6800
},
{
"epoch": 6.282952548330404,
"grad_norm": 0.3306183716934296,
"learning_rate": 1.2716091617972159e-06,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28983038663864136,
"step": 3575,
"valid_targets_mean": 7270.4,
"valid_targets_min": 791
},
{
"epoch": 6.291739894551846,
"grad_norm": 0.288156104658097,
"learning_rate": 1.2410321750753518e-06,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2841329574584961,
"step": 3580,
"valid_targets_mean": 8245.0,
"valid_targets_min": 7001
},
{
"epoch": 6.300527240773286,
"grad_norm": 0.3189483618108163,
"learning_rate": 1.2108155279562017e-06,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2912044823169708,
"step": 3585,
"valid_targets_mean": 8160.7,
"valid_targets_min": 6868
},
{
"epoch": 6.309314586994727,
"grad_norm": 0.3162820394259654,
"learning_rate": 1.180959800869077e-06,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28558826446533203,
"step": 3590,
"valid_targets_mean": 7097.2,
"valid_targets_min": 942
},
{
"epoch": 6.318101933216169,
"grad_norm": 0.3227516251151931,
"learning_rate": 1.1514655673103857e-06,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29469990730285645,
"step": 3595,
"valid_targets_mean": 7176.0,
"valid_targets_min": 953
},
{
"epoch": 6.3268892794376095,
"grad_norm": 0.30824799317875473,
"learning_rate": 1.1223333938326486e-06,
"loss": 0.2978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2922055125236511,
"step": 3600,
"valid_targets_mean": 8607.1,
"valid_targets_min": 7140
},
{
"epoch": 6.335676625659051,
"grad_norm": 0.30642048579731107,
"learning_rate": 1.0935638400335979e-06,
"loss": 0.2862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27427494525909424,
"step": 3605,
"valid_targets_mean": 7716.3,
"valid_targets_min": 6915
},
{
"epoch": 6.344463971880492,
"grad_norm": 0.312070601993189,
"learning_rate": 1.0651574585454228e-06,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2751944065093994,
"step": 3610,
"valid_targets_mean": 7600.4,
"valid_targets_min": 6989
},
{
"epoch": 6.353251318101933,
"grad_norm": 0.321136362911428,
"learning_rate": 1.0371147950241745e-06,
"loss": 0.2861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2760077714920044,
"step": 3615,
"valid_targets_mean": 7750.4,
"valid_targets_min": 6813
},
{
"epoch": 6.362038664323374,
"grad_norm": 0.31382693813094326,
"learning_rate": 1.0094363881392665e-06,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2901709973812103,
"step": 3620,
"valid_targets_mean": 7908.2,
"valid_targets_min": 7082
},
{
"epoch": 6.370826010544816,
"grad_norm": 0.2981295280096082,
"learning_rate": 9.821227695631386e-07,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29155126214027405,
"step": 3625,
"valid_targets_mean": 8371.8,
"valid_targets_min": 6965
},
{
"epoch": 6.3796133567662565,
"grad_norm": 0.3109551271191042,
"learning_rate": 9.551744639610328e-07,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29289332032203674,
"step": 3630,
"valid_targets_mean": 7768.1,
"valid_targets_min": 6719
},
{
"epoch": 6.388400702987697,
"grad_norm": 0.31434253460561856,
"learning_rate": 9.285919889809314e-07,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28384581208229065,
"step": 3635,
"valid_targets_mean": 7665.1,
"valid_targets_min": 6037
},
{
"epoch": 6.397188049209139,
"grad_norm": 0.3092004304420906,
"learning_rate": 9.023758552435935e-07,
"loss": 0.288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28531426191329956,
"step": 3640,
"valid_targets_mean": 7512.6,
"valid_targets_min": 6270
},
{
"epoch": 6.40597539543058,
"grad_norm": 0.29452660133273145,
"learning_rate": 8.765265663327605e-07,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2935437560081482,
"step": 3645,
"valid_targets_mean": 8569.4,
"valid_targets_min": 7046
},
{
"epoch": 6.414762741652021,
"grad_norm": 0.3228870917587924,
"learning_rate": 8.510446187854793e-07,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30004414916038513,
"step": 3650,
"valid_targets_mean": 7375.8,
"valid_targets_min": 1943
},
{
"epoch": 6.423550087873462,
"grad_norm": 0.2939772904058792,
"learning_rate": 8.259305020825703e-07,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2851170003414154,
"step": 3655,
"valid_targets_mean": 8229.3,
"valid_targets_min": 5952
},
{
"epoch": 6.4323374340949035,
"grad_norm": 0.31427818308611555,
"learning_rate": 8.011846986392058e-07,
"loss": 0.2917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28981322050094604,
"step": 3660,
"valid_targets_mean": 7931.1,
"valid_targets_min": 6975
},
{
"epoch": 6.441124780316344,
"grad_norm": 0.3041927647921443,
"learning_rate": 7.768076837956728e-07,
"loss": 0.2929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28967010974884033,
"step": 3665,
"valid_targets_mean": 8059.9,
"valid_targets_min": 6901
},
{
"epoch": 6.449912126537786,
"grad_norm": 0.309905165653539,
"learning_rate": 7.527999258082052e-07,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.293418288230896,
"step": 3670,
"valid_targets_mean": 7485.3,
"valid_targets_min": 6300
},
{
"epoch": 6.458699472759227,
"grad_norm": 0.3188919596891954,
"learning_rate": 7.291618858400329e-07,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3023364841938019,
"step": 3675,
"valid_targets_mean": 8096.2,
"valid_targets_min": 598
},
{
"epoch": 6.467486818980668,
"grad_norm": 0.31250436474473514,
"learning_rate": 7.058940179524842e-07,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28131306171417236,
"step": 3680,
"valid_targets_mean": 7808.1,
"valid_targets_min": 6935
},
{
"epoch": 6.476274165202109,
"grad_norm": 0.32620003785829454,
"learning_rate": 6.829967690962802e-07,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2991110682487488,
"step": 3685,
"valid_targets_mean": 7430.6,
"valid_targets_min": 3281
},
{
"epoch": 6.48506151142355,
"grad_norm": 0.32019753496373277,
"learning_rate": 6.604705791029586e-07,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2853609025478363,
"step": 3690,
"valid_targets_mean": 7720.6,
"valid_targets_min": 7246
},
{
"epoch": 6.493848857644991,
"grad_norm": 0.3328672541361672,
"learning_rate": 6.383158806764056e-07,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3027670383453369,
"step": 3695,
"valid_targets_mean": 7264.8,
"valid_targets_min": 1832
},
{
"epoch": 6.502636203866432,
"grad_norm": 0.31555792657873133,
"learning_rate": 6.165330993845598e-07,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2928489148616791,
"step": 3700,
"valid_targets_mean": 7662.8,
"valid_targets_min": 6781
},
{
"epoch": 6.511423550087874,
"grad_norm": 0.2997259977928076,
"learning_rate": 5.951226536512278e-07,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2773165702819824,
"step": 3705,
"valid_targets_mean": 7742.9,
"valid_targets_min": 6895
},
{
"epoch": 6.520210896309314,
"grad_norm": 0.32133966328124486,
"learning_rate": 5.740849547480576e-07,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2966843247413635,
"step": 3710,
"valid_targets_mean": 7586.9,
"valid_targets_min": 6442
},
{
"epoch": 6.528998242530756,
"grad_norm": 0.286972029950041,
"learning_rate": 5.534204067866178e-07,
"loss": 0.2839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2870764434337616,
"step": 3715,
"valid_targets_mean": 8555.6,
"valid_targets_min": 6858
},
{
"epoch": 6.537785588752197,
"grad_norm": 0.3173654710056662,
"learning_rate": 5.331294067106618e-07,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28059589862823486,
"step": 3720,
"valid_targets_mean": 7745.3,
"valid_targets_min": 6357
},
{
"epoch": 6.546572934973638,
"grad_norm": 0.30413824614155777,
"learning_rate": 5.132123442884829e-07,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29954957962036133,
"step": 3725,
"valid_targets_mean": 9327.6,
"valid_targets_min": 6934
},
{
"epoch": 6.555360281195079,
"grad_norm": 0.3301537920025548,
"learning_rate": 4.936696021054377e-07,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29152911901474,
"step": 3730,
"valid_targets_mean": 7535.8,
"valid_targets_min": 6846
},
{
"epoch": 6.564147627416521,
"grad_norm": 0.32086744682083185,
"learning_rate": 4.7450155555658794e-07,
"loss": 0.2881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28596755862236023,
"step": 3735,
"valid_targets_mean": 7662.6,
"valid_targets_min": 6982
},
{
"epoch": 6.572934973637961,
"grad_norm": 0.3085282182860389,
"learning_rate": 4.557085728395039e-07,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2964562177658081,
"step": 3740,
"valid_targets_mean": 7674.9,
"valid_targets_min": 6779
},
{
"epoch": 6.581722319859402,
"grad_norm": 0.3048089993533843,
"learning_rate": 4.372910149471743e-07,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2835426926612854,
"step": 3745,
"valid_targets_mean": 8123.1,
"valid_targets_min": 6833
},
{
"epoch": 6.590509666080844,
"grad_norm": 0.30328995717816737,
"learning_rate": 4.1924923566108336e-07,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29824134707450867,
"step": 3750,
"valid_targets_mean": 7895.9,
"valid_targets_min": 6334
},
{
"epoch": 6.5992970123022845,
"grad_norm": 0.3237878832597593,
"learning_rate": 4.015835815444158e-07,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29479193687438965,
"step": 3755,
"valid_targets_mean": 7718.5,
"valid_targets_min": 6643
},
{
"epoch": 6.608084358523726,
"grad_norm": 0.3084873991845284,
"learning_rate": 3.842943919353914e-07,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28741276264190674,
"step": 3760,
"valid_targets_mean": 7682.5,
"valid_targets_min": 7047
},
{
"epoch": 6.616871704745167,
"grad_norm": 0.31846598698805506,
"learning_rate": 3.6738199894075454e-07,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2965297996997833,
"step": 3765,
"valid_targets_mean": 7662.4,
"valid_targets_min": 6642
},
{
"epoch": 6.6256590509666085,
"grad_norm": 0.3161130165643001,
"learning_rate": 3.508467274293903e-07,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2934122383594513,
"step": 3770,
"valid_targets_mean": 7776.6,
"valid_targets_min": 6906
},
{
"epoch": 6.634446397188049,
"grad_norm": 0.318539965119587,
"learning_rate": 3.3468889502608957e-07,
"loss": 0.2873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2931661605834961,
"step": 3775,
"valid_targets_mean": 7592.9,
"valid_targets_min": 7114
},
{
"epoch": 6.643233743409491,
"grad_norm": 0.3299262714481787,
"learning_rate": 3.1890881210543625e-07,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29032421112060547,
"step": 3780,
"valid_targets_mean": 7454.5,
"valid_targets_min": 5869
},
{
"epoch": 6.6520210896309315,
"grad_norm": 0.33860570015403696,
"learning_rate": 3.0350678178585834e-07,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29499220848083496,
"step": 3785,
"valid_targets_mean": 7219.4,
"valid_targets_min": 787
},
{
"epoch": 6.660808435852372,
"grad_norm": 0.3087571948862897,
"learning_rate": 2.884830999237953e-07,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27930399775505066,
"step": 3790,
"valid_targets_mean": 7931.0,
"valid_targets_min": 6713
},
{
"epoch": 6.669595782073814,
"grad_norm": 0.3040127214705321,
"learning_rate": 2.7383805510802884e-07,
"loss": 0.2884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2921474575996399,
"step": 3795,
"valid_targets_mean": 7779.0,
"valid_targets_min": 6741
},
{
"epoch": 6.678383128295255,
"grad_norm": 0.3383204812705453,
"learning_rate": 2.5957192865411653e-07,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2986317574977875,
"step": 3800,
"valid_targets_mean": 7771.4,
"valid_targets_min": 6909
},
{
"epoch": 6.687170474516696,
"grad_norm": 0.3145720712599281,
"learning_rate": 2.4568499459901585e-07,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2892332673072815,
"step": 3805,
"valid_targets_mean": 7687.5,
"valid_targets_min": 6181
},
{
"epoch": 6.695957820738137,
"grad_norm": 0.3076130863525781,
"learning_rate": 2.3217751969579315e-07,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29126110672950745,
"step": 3810,
"valid_targets_mean": 7834.6,
"valid_targets_min": 6803
},
{
"epoch": 6.704745166959579,
"grad_norm": 0.29341564576186163,
"learning_rate": 2.1904976340852535e-07,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2846061587333679,
"step": 3815,
"valid_targets_mean": 9068.6,
"valid_targets_min": 7232
},
{
"epoch": 6.713532513181019,
"grad_norm": 0.32891744732904976,
"learning_rate": 2.0630197790728834e-07,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2955701947212219,
"step": 3820,
"valid_targets_mean": 7397.4,
"valid_targets_min": 3926
},
{
"epoch": 6.722319859402461,
"grad_norm": 0.30423508236207003,
"learning_rate": 1.9393440806334096e-07,
"loss": 0.2846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28711095452308655,
"step": 3825,
"valid_targets_mean": 7855.9,
"valid_targets_min": 7202
},
{
"epoch": 6.731107205623902,
"grad_norm": 0.2903631980463757,
"learning_rate": 1.819472914443998e-07,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27378320693969727,
"step": 3830,
"valid_targets_mean": 8380.3,
"valid_targets_min": 7309
},
{
"epoch": 6.739894551845342,
"grad_norm": 0.3046077789434804,
"learning_rate": 1.7034085831008962e-07,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29257017374038696,
"step": 3835,
"valid_targets_mean": 8174.4,
"valid_targets_min": 7042
},
{
"epoch": 6.748681898066784,
"grad_norm": 0.32891229467930705,
"learning_rate": 1.5911533160750668e-07,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2956711947917938,
"step": 3840,
"valid_targets_mean": 7624.0,
"valid_targets_min": 6117
},
{
"epoch": 6.757469244288225,
"grad_norm": 0.32114057955257985,
"learning_rate": 1.4827092696695578e-07,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28788745403289795,
"step": 3845,
"valid_targets_mean": 7714.6,
"valid_targets_min": 7214
},
{
"epoch": 6.766256590509666,
"grad_norm": 0.309070622824398,
"learning_rate": 1.3780785269778662e-07,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2973918914794922,
"step": 3850,
"valid_targets_mean": 7914.4,
"valid_targets_min": 7277
},
{
"epoch": 6.775043936731107,
"grad_norm": 0.30444702757635617,
"learning_rate": 1.2772630978440836e-07,
"loss": 0.289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28852379322052,
"step": 3855,
"valid_targets_mean": 8496.9,
"valid_targets_min": 6456
},
{
"epoch": 6.783831282952549,
"grad_norm": 0.31099725831636593,
"learning_rate": 1.1802649188241921e-07,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.301106333732605,
"step": 3860,
"valid_targets_mean": 8705.3,
"valid_targets_min": 7320
},
{
"epoch": 6.792618629173989,
"grad_norm": 0.3061079171087977,
"learning_rate": 1.087085853148917e-07,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2869272530078888,
"step": 3865,
"valid_targets_mean": 7711.6,
"valid_targets_min": 6146
},
{
"epoch": 6.801405975395431,
"grad_norm": 0.31187087252494716,
"learning_rate": 9.97727690687933e-08,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2869059443473816,
"step": 3870,
"valid_targets_mean": 7796.6,
"valid_targets_min": 6426
},
{
"epoch": 6.810193321616872,
"grad_norm": 0.2948395711008696,
"learning_rate": 9.121921479154694e-08,
"loss": 0.2859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28761497139930725,
"step": 3875,
"valid_targets_mean": 8341.2,
"valid_targets_min": 6642
},
{
"epoch": 6.8189806678383125,
"grad_norm": 0.3267583846230294,
"learning_rate": 8.30480867877359e-08,
"loss": 0.293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30055350065231323,
"step": 3880,
"valid_targets_mean": 8443.2,
"valid_targets_min": 7058
},
{
"epoch": 6.827768014059754,
"grad_norm": 0.33397140582769613,
"learning_rate": 7.525954201593966e-08,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2964109778404236,
"step": 3885,
"valid_targets_mean": 7824.0,
"valid_targets_min": 7005
},
{
"epoch": 6.836555360281195,
"grad_norm": 0.28970904880913834,
"learning_rate": 6.785373008573181e-08,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27363112568855286,
"step": 3890,
"valid_targets_mean": 7667.0,
"valid_targets_min": 7054
},
{
"epoch": 6.845342706502636,
"grad_norm": 0.330650600657506,
"learning_rate": 6.083079325479357e-08,
"loss": 0.2926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2953321933746338,
"step": 3895,
"valid_targets_mean": 7530.6,
"valid_targets_min": 6828
},
{
"epoch": 6.854130052724077,
"grad_norm": 0.31587378767103247,
"learning_rate": 5.4190866426195866e-08,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28235381841659546,
"step": 3900,
"valid_targets_mean": 7967.4,
"valid_targets_min": 7182
},
{
"epoch": 6.862917398945519,
"grad_norm": 0.33377421716490563,
"learning_rate": 4.793407714579035e-08,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27941250801086426,
"step": 3905,
"valid_targets_mean": 7071.4,
"valid_targets_min": 764
},
{
"epoch": 6.8717047451669595,
"grad_norm": 0.31805688656222625,
"learning_rate": 4.2060545599773574e-08,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2866838276386261,
"step": 3910,
"valid_targets_mean": 7444.9,
"valid_targets_min": 6530
},
{
"epoch": 6.880492091388401,
"grad_norm": 0.30469628346307415,
"learning_rate": 3.6570384612368834e-08,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2791711091995239,
"step": 3915,
"valid_targets_mean": 7580.8,
"valid_targets_min": 6620
},
{
"epoch": 6.889279437609842,
"grad_norm": 0.2982641769682887,
"learning_rate": 3.146369964366791e-08,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27555572986602783,
"step": 3920,
"valid_targets_mean": 8302.6,
"valid_targets_min": 7055
},
{
"epoch": 6.898066783831283,
"grad_norm": 0.27981864432775694,
"learning_rate": 2.674058878759933e-08,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29031240940093994,
"step": 3925,
"valid_targets_mean": 9336.2,
"valid_targets_min": 6065
},
{
"epoch": 6.906854130052724,
"grad_norm": 0.31699318487313444,
"learning_rate": 2.240114277004324e-08,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2884048521518707,
"step": 3930,
"valid_targets_mean": 7750.0,
"valid_targets_min": 6825
},
{
"epoch": 6.915641476274165,
"grad_norm": 0.3150763779616322,
"learning_rate": 1.844544494709277e-08,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2877803444862366,
"step": 3935,
"valid_targets_mean": 7871.9,
"valid_targets_min": 6823
},
{
"epoch": 6.9244288224956065,
"grad_norm": 0.3012630929462455,
"learning_rate": 1.4873571303448687e-08,
"loss": 0.2792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2717800438404083,
"step": 3940,
"valid_targets_mean": 7653.2,
"valid_targets_min": 6664
},
{
"epoch": 6.933216168717047,
"grad_norm": 0.317214261259486,
"learning_rate": 1.1685590450962736e-08,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28537219762802124,
"step": 3945,
"valid_targets_mean": 7671.8,
"valid_targets_min": 6867
},
{
"epoch": 6.942003514938489,
"grad_norm": 0.29991630247313383,
"learning_rate": 8.881563627320955e-09,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27608373761177063,
"step": 3950,
"valid_targets_mean": 7615.9,
"valid_targets_min": 6974
},
{
"epoch": 6.95079086115993,
"grad_norm": 0.2959598145640836,
"learning_rate": 6.461544694864596e-09,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29918140172958374,
"step": 3955,
"valid_targets_mean": 8303.6,
"valid_targets_min": 6911
},
{
"epoch": 6.959578207381371,
"grad_norm": 0.30081974960794616,
"learning_rate": 4.4255801395554075e-09,
"loss": 0.2889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28856515884399414,
"step": 3960,
"valid_targets_mean": 9260.8,
"valid_targets_min": 7282
},
{
"epoch": 6.968365553602812,
"grad_norm": 0.32922681699591744,
"learning_rate": 2.773709070080788e-09,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29428255558013916,
"step": 3965,
"valid_targets_mean": 7888.9,
"valid_targets_min": 6834
},
{
"epoch": 6.977152899824253,
"grad_norm": 0.31492340742066066,
"learning_rate": 1.5059632171099402e-09,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29231247305870056,
"step": 3970,
"valid_targets_mean": 7748.9,
"valid_targets_min": 967
},
{
"epoch": 6.985940246045694,
"grad_norm": 0.30231619440695345,
"learning_rate": 6.22366932676588e-10,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29516685009002686,
"step": 3975,
"valid_targets_mean": 8495.4,
"valid_targets_min": 6964
},
{
"epoch": 6.994727592267135,
"grad_norm": 0.2997116532045884,
"learning_rate": 1.229371897149001e-10,
"loss": 0.2832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2693384289741516,
"step": 3980,
"valid_targets_mean": 7885.3,
"valid_targets_min": 7269
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2778266668319702,
"step": 3983,
"total_flos": 1690778105544704.0,
"train_loss": 0.31329786029258266,
"train_runtime": 27268.6753,
"train_samples_per_second": 2.334,
"train_steps_per_second": 0.146,
"valid_targets_mean": 7882.6,
"valid_targets_min": 6749
}
],
"logging_steps": 5,
"max_steps": 3983,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1690778105544704.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}