Files
e1_gpt_long_sandboxes_2x_ta…/trainer_state.json
ModelHub XC f2421355ca 初始化项目,由ModelHub XC社区提供模型
Model: DCAgent/e1_gpt_long_sandboxes_2x_tacc-Qwen3-8B
Source: Original Platform
2026-04-26 21:07:02 +08:00

20233 lines
562 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 9177,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0038138825324180014,
"grad_norm": 9.470755296878524,
"learning_rate": 1.7429193899782138e-07,
"loss": 0.8166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8353788256645203,
"step": 5,
"valid_targets_mean": 5229.4,
"valid_targets_min": 1152
},
{
"epoch": 0.007627765064836003,
"grad_norm": 11.999543819314578,
"learning_rate": 3.921568627450981e-07,
"loss": 0.8786,
"loss_nan_ranks": 0,
"loss_rank_avg": 1.0028491020202637,
"step": 10,
"valid_targets_mean": 3283.0,
"valid_targets_min": 660
},
{
"epoch": 0.011441647597254004,
"grad_norm": 10.891241780249842,
"learning_rate": 6.100217864923748e-07,
"loss": 0.8257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8274946212768555,
"step": 15,
"valid_targets_mean": 4470.2,
"valid_targets_min": 1025
},
{
"epoch": 0.015255530129672006,
"grad_norm": 9.997792672692631,
"learning_rate": 8.278867102396515e-07,
"loss": 0.8311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.8327676653862,
"step": 20,
"valid_targets_mean": 4210.0,
"valid_targets_min": 345
},
{
"epoch": 0.01906941266209001,
"grad_norm": 8.877819827048429,
"learning_rate": 1.0457516339869283e-06,
"loss": 0.8057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7901816964149475,
"step": 25,
"valid_targets_mean": 4130.4,
"valid_targets_min": 1404
},
{
"epoch": 0.02288329519450801,
"grad_norm": 8.096441526748734,
"learning_rate": 1.2636165577342049e-06,
"loss": 0.808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7575476765632629,
"step": 30,
"valid_targets_mean": 3961.3,
"valid_targets_min": 1118
},
{
"epoch": 0.02669717772692601,
"grad_norm": 5.796639402961682,
"learning_rate": 1.4814814814814815e-06,
"loss": 0.7743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7839180827140808,
"step": 35,
"valid_targets_mean": 4570.6,
"valid_targets_min": 782
},
{
"epoch": 0.03051106025934401,
"grad_norm": 4.5778398820035555,
"learning_rate": 1.6993464052287585e-06,
"loss": 0.7824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7421620488166809,
"step": 40,
"valid_targets_mean": 4959.4,
"valid_targets_min": 1531
},
{
"epoch": 0.034324942791762014,
"grad_norm": 3.104932493714994,
"learning_rate": 1.917211328976035e-06,
"loss": 0.6661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6358296275138855,
"step": 45,
"valid_targets_mean": 4961.0,
"valid_targets_min": 1151
},
{
"epoch": 0.03813882532418002,
"grad_norm": 3.2109157965025417,
"learning_rate": 2.135076252723312e-06,
"loss": 0.6704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6529257297515869,
"step": 50,
"valid_targets_mean": 3586.6,
"valid_targets_min": 449
},
{
"epoch": 0.041952707856598014,
"grad_norm": 2.150373234220549,
"learning_rate": 2.3529411764705885e-06,
"loss": 0.6812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7103098034858704,
"step": 55,
"valid_targets_mean": 4680.6,
"valid_targets_min": 1299
},
{
"epoch": 0.04576659038901602,
"grad_norm": 1.5051584529967943,
"learning_rate": 2.570806100217865e-06,
"loss": 0.6306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6322097778320312,
"step": 60,
"valid_targets_mean": 4604.5,
"valid_targets_min": 833
},
{
"epoch": 0.04958047292143402,
"grad_norm": 1.372839166404494,
"learning_rate": 2.788671023965142e-06,
"loss": 0.623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5981409549713135,
"step": 65,
"valid_targets_mean": 3717.8,
"valid_targets_min": 301
},
{
"epoch": 0.05339435545385202,
"grad_norm": 1.2972075810391417,
"learning_rate": 3.0065359477124182e-06,
"loss": 0.6228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6940057873725891,
"step": 70,
"valid_targets_mean": 3829.6,
"valid_targets_min": 1278
},
{
"epoch": 0.057208237986270026,
"grad_norm": 0.9279377869597232,
"learning_rate": 3.2244008714596952e-06,
"loss": 0.6054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6068126559257507,
"step": 75,
"valid_targets_mean": 5117.9,
"valid_targets_min": 938
},
{
"epoch": 0.06102212051868802,
"grad_norm": 0.9158878206222738,
"learning_rate": 3.4422657952069723e-06,
"loss": 0.5969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5890101790428162,
"step": 80,
"valid_targets_mean": 4001.0,
"valid_targets_min": 768
},
{
"epoch": 0.06483600305110603,
"grad_norm": 0.8582325602905675,
"learning_rate": 3.6601307189542484e-06,
"loss": 0.5925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.616851806640625,
"step": 85,
"valid_targets_mean": 4640.2,
"valid_targets_min": 956
},
{
"epoch": 0.06864988558352403,
"grad_norm": 0.8125076785088601,
"learning_rate": 3.8779956427015254e-06,
"loss": 0.5796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5934779644012451,
"step": 90,
"valid_targets_mean": 4000.2,
"valid_targets_min": 1232
},
{
"epoch": 0.07246376811594203,
"grad_norm": 0.6943712006747517,
"learning_rate": 4.0958605664488025e-06,
"loss": 0.5544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5483887195587158,
"step": 95,
"valid_targets_mean": 4390.5,
"valid_targets_min": 659
},
{
"epoch": 0.07627765064836003,
"grad_norm": 0.6230323834581825,
"learning_rate": 4.313725490196079e-06,
"loss": 0.5606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5412846803665161,
"step": 100,
"valid_targets_mean": 4160.7,
"valid_targets_min": 972
},
{
"epoch": 0.08009153318077804,
"grad_norm": 0.875591747930727,
"learning_rate": 4.531590413943356e-06,
"loss": 0.525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49036863446235657,
"step": 105,
"valid_targets_mean": 3680.2,
"valid_targets_min": 1247
},
{
"epoch": 0.08390541571319603,
"grad_norm": 0.5510216943897367,
"learning_rate": 4.749455337690632e-06,
"loss": 0.5576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4874543249607086,
"step": 110,
"valid_targets_mean": 4145.7,
"valid_targets_min": 1149
},
{
"epoch": 0.08771929824561403,
"grad_norm": 0.5426893613443619,
"learning_rate": 4.967320261437909e-06,
"loss": 0.5387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5104167461395264,
"step": 115,
"valid_targets_mean": 4632.5,
"valid_targets_min": 1081
},
{
"epoch": 0.09153318077803203,
"grad_norm": 0.551676285668215,
"learning_rate": 5.185185185185185e-06,
"loss": 0.5484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5294644236564636,
"step": 120,
"valid_targets_mean": 4924.3,
"valid_targets_min": 1112
},
{
"epoch": 0.09534706331045004,
"grad_norm": 0.5270524880611899,
"learning_rate": 5.403050108932463e-06,
"loss": 0.5164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44165608286857605,
"step": 125,
"valid_targets_mean": 4687.0,
"valid_targets_min": 1765
},
{
"epoch": 0.09916094584286804,
"grad_norm": 0.48986406955989537,
"learning_rate": 5.620915032679739e-06,
"loss": 0.4987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4905380308628082,
"step": 130,
"valid_targets_mean": 4783.9,
"valid_targets_min": 872
},
{
"epoch": 0.10297482837528604,
"grad_norm": 0.5186763368356251,
"learning_rate": 5.838779956427015e-06,
"loss": 0.52,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5089920163154602,
"step": 135,
"valid_targets_mean": 4795.2,
"valid_targets_min": 1039
},
{
"epoch": 0.10678871090770405,
"grad_norm": 0.5010334333520292,
"learning_rate": 6.056644880174293e-06,
"loss": 0.5146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5307483673095703,
"step": 140,
"valid_targets_mean": 5161.2,
"valid_targets_min": 1295
},
{
"epoch": 0.11060259344012205,
"grad_norm": 0.5123633336801784,
"learning_rate": 6.274509803921569e-06,
"loss": 0.5178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4454838037490845,
"step": 145,
"valid_targets_mean": 3884.6,
"valid_targets_min": 1002
},
{
"epoch": 0.11441647597254005,
"grad_norm": 0.5491751275251507,
"learning_rate": 6.492374727668845e-06,
"loss": 0.4921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5181975364685059,
"step": 150,
"valid_targets_mean": 4045.0,
"valid_targets_min": 1020
},
{
"epoch": 0.11823035850495804,
"grad_norm": 2.500737350039349,
"learning_rate": 6.710239651416122e-06,
"loss": 0.4828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4583951532840729,
"step": 155,
"valid_targets_mean": 4955.4,
"valid_targets_min": 1056
},
{
"epoch": 0.12204424103737604,
"grad_norm": 0.4536799712131569,
"learning_rate": 6.928104575163399e-06,
"loss": 0.501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45491790771484375,
"step": 160,
"valid_targets_mean": 4887.3,
"valid_targets_min": 1317
},
{
"epoch": 0.12585812356979406,
"grad_norm": 0.5705305236405581,
"learning_rate": 7.145969498910676e-06,
"loss": 0.7423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4795728921890259,
"step": 165,
"valid_targets_mean": 3697.1,
"valid_targets_min": 433
},
{
"epoch": 0.12967200610221205,
"grad_norm": 0.5378675959231818,
"learning_rate": 7.363834422657953e-06,
"loss": 0.5011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4969773292541504,
"step": 170,
"valid_targets_mean": 4247.1,
"valid_targets_min": 939
},
{
"epoch": 0.13348588863463004,
"grad_norm": 0.5413191072539879,
"learning_rate": 7.581699346405229e-06,
"loss": 0.4931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46094343066215515,
"step": 175,
"valid_targets_mean": 3648.6,
"valid_targets_min": 1373
},
{
"epoch": 0.13729977116704806,
"grad_norm": 0.4947370912132374,
"learning_rate": 7.799564270152506e-06,
"loss": 0.5081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43682071566581726,
"step": 180,
"valid_targets_mean": 3943.0,
"valid_targets_min": 990
},
{
"epoch": 0.14111365369946605,
"grad_norm": 0.5277722158585259,
"learning_rate": 8.017429193899784e-06,
"loss": 0.4734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4734993875026703,
"step": 185,
"valid_targets_mean": 4291.0,
"valid_targets_min": 1033
},
{
"epoch": 0.14492753623188406,
"grad_norm": 0.5624419217272335,
"learning_rate": 8.23529411764706e-06,
"loss": 0.4905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46875128149986267,
"step": 190,
"valid_targets_mean": 3662.4,
"valid_targets_min": 874
},
{
"epoch": 0.14874141876430205,
"grad_norm": 0.49793152277491554,
"learning_rate": 8.453159041394336e-06,
"loss": 0.4859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47551751136779785,
"step": 195,
"valid_targets_mean": 4590.5,
"valid_targets_min": 934
},
{
"epoch": 0.15255530129672007,
"grad_norm": 0.47365481578115076,
"learning_rate": 8.671023965141612e-06,
"loss": 0.4974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.509818971157074,
"step": 200,
"valid_targets_mean": 5085.7,
"valid_targets_min": 1068
},
{
"epoch": 0.15636918382913806,
"grad_norm": 0.5712494209301259,
"learning_rate": 8.888888888888888e-06,
"loss": 0.4751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4649386405944824,
"step": 205,
"valid_targets_mean": 3302.5,
"valid_targets_min": 1013
},
{
"epoch": 0.16018306636155608,
"grad_norm": 0.5084803651986027,
"learning_rate": 9.106753812636166e-06,
"loss": 0.4449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.473945289850235,
"step": 210,
"valid_targets_mean": 4434.8,
"valid_targets_min": 1002
},
{
"epoch": 0.16399694889397406,
"grad_norm": 0.5184435672003983,
"learning_rate": 9.324618736383442e-06,
"loss": 0.4346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3982456624507904,
"step": 215,
"valid_targets_mean": 3852.2,
"valid_targets_min": 870
},
{
"epoch": 0.16781083142639205,
"grad_norm": 0.4868051846661637,
"learning_rate": 9.54248366013072e-06,
"loss": 0.4829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48539039492607117,
"step": 220,
"valid_targets_mean": 6059.0,
"valid_targets_min": 865
},
{
"epoch": 0.17162471395881007,
"grad_norm": 0.5409139800606549,
"learning_rate": 9.760348583877996e-06,
"loss": 0.4629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47836971282958984,
"step": 225,
"valid_targets_mean": 4304.7,
"valid_targets_min": 890
},
{
"epoch": 0.17543859649122806,
"grad_norm": 0.5009648662623246,
"learning_rate": 9.978213507625273e-06,
"loss": 0.4451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4605931043624878,
"step": 230,
"valid_targets_mean": 5225.0,
"valid_targets_min": 1847
},
{
"epoch": 0.17925247902364608,
"grad_norm": 0.5140950082674012,
"learning_rate": 1.0196078431372549e-05,
"loss": 0.4662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43352267146110535,
"step": 235,
"valid_targets_mean": 5232.6,
"valid_targets_min": 1525
},
{
"epoch": 0.18306636155606407,
"grad_norm": 0.579977428231358,
"learning_rate": 1.0413943355119827e-05,
"loss": 0.4508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4714777171611786,
"step": 240,
"valid_targets_mean": 4931.0,
"valid_targets_min": 1398
},
{
"epoch": 0.18688024408848208,
"grad_norm": 0.5864749503460456,
"learning_rate": 1.0631808278867104e-05,
"loss": 0.4469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4570702612400055,
"step": 245,
"valid_targets_mean": 4803.3,
"valid_targets_min": 787
},
{
"epoch": 0.19069412662090007,
"grad_norm": 0.4372149960084067,
"learning_rate": 1.0849673202614379e-05,
"loss": 0.4472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42177343368530273,
"step": 250,
"valid_targets_mean": 5634.1,
"valid_targets_min": 1214
},
{
"epoch": 0.1945080091533181,
"grad_norm": 0.5238824399942199,
"learning_rate": 1.1067538126361657e-05,
"loss": 0.4621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40550434589385986,
"step": 255,
"valid_targets_mean": 4041.0,
"valid_targets_min": 1198
},
{
"epoch": 0.19832189168573608,
"grad_norm": 0.5263090103192474,
"learning_rate": 1.1285403050108935e-05,
"loss": 0.4491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4669533669948578,
"step": 260,
"valid_targets_mean": 4864.0,
"valid_targets_min": 348
},
{
"epoch": 0.20213577421815407,
"grad_norm": 0.4844855824860165,
"learning_rate": 1.1503267973856209e-05,
"loss": 0.4356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4767606556415558,
"step": 265,
"valid_targets_mean": 4571.4,
"valid_targets_min": 1294
},
{
"epoch": 0.20594965675057209,
"grad_norm": 0.5844330632392677,
"learning_rate": 1.1721132897603487e-05,
"loss": 0.4694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5140058398246765,
"step": 270,
"valid_targets_mean": 3920.4,
"valid_targets_min": 934
},
{
"epoch": 0.20976353928299007,
"grad_norm": 0.528817963711389,
"learning_rate": 1.1938997821350765e-05,
"loss": 0.4432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4353533089160919,
"step": 275,
"valid_targets_mean": 4601.6,
"valid_targets_min": 863
},
{
"epoch": 0.2135774218154081,
"grad_norm": 0.5006857035283947,
"learning_rate": 1.215686274509804e-05,
"loss": 0.461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4613196551799774,
"step": 280,
"valid_targets_mean": 4929.3,
"valid_targets_min": 981
},
{
"epoch": 0.21739130434782608,
"grad_norm": 0.47435927216376855,
"learning_rate": 1.2374727668845317e-05,
"loss": 0.4646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4284130334854126,
"step": 285,
"valid_targets_mean": 4549.0,
"valid_targets_min": 1071
},
{
"epoch": 0.2212051868802441,
"grad_norm": 0.48912815677244226,
"learning_rate": 1.2592592592592593e-05,
"loss": 0.441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.438406378030777,
"step": 290,
"valid_targets_mean": 4591.1,
"valid_targets_min": 1050
},
{
"epoch": 0.2250190694126621,
"grad_norm": 0.4913986455786091,
"learning_rate": 1.281045751633987e-05,
"loss": 0.4563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.485249787569046,
"step": 295,
"valid_targets_mean": 4955.3,
"valid_targets_min": 935
},
{
"epoch": 0.2288329519450801,
"grad_norm": 0.47839058332511075,
"learning_rate": 1.3028322440087147e-05,
"loss": 0.4757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45996996760368347,
"step": 300,
"valid_targets_mean": 4854.8,
"valid_targets_min": 1379
},
{
"epoch": 0.2326468344774981,
"grad_norm": 0.5908371229215295,
"learning_rate": 1.3246187363834424e-05,
"loss": 0.4286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4527187645435333,
"step": 305,
"valid_targets_mean": 4125.8,
"valid_targets_min": 1221
},
{
"epoch": 0.23646071700991608,
"grad_norm": 0.558504394945239,
"learning_rate": 1.3464052287581701e-05,
"loss": 0.4645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46870169043540955,
"step": 310,
"valid_targets_mean": 4148.9,
"valid_targets_min": 1389
},
{
"epoch": 0.2402745995423341,
"grad_norm": 0.5561787164121977,
"learning_rate": 1.3681917211328976e-05,
"loss": 0.4245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.407299280166626,
"step": 315,
"valid_targets_mean": 3703.2,
"valid_targets_min": 1119
},
{
"epoch": 0.2440884820747521,
"grad_norm": 0.5406060809535468,
"learning_rate": 1.3899782135076254e-05,
"loss": 0.4362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3715898096561432,
"step": 320,
"valid_targets_mean": 4031.1,
"valid_targets_min": 1148
},
{
"epoch": 0.2479023646071701,
"grad_norm": 1.4983453657518973,
"learning_rate": 1.4117647058823532e-05,
"loss": 0.5043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6690896153450012,
"step": 325,
"valid_targets_mean": 1204.7,
"valid_targets_min": 562
},
{
"epoch": 0.2517162471395881,
"grad_norm": 0.9150855492826523,
"learning_rate": 1.4335511982570806e-05,
"loss": 0.7726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5599314570426941,
"step": 330,
"valid_targets_mean": 1777.9,
"valid_targets_min": 629
},
{
"epoch": 0.2555301296720061,
"grad_norm": 0.5586598650153595,
"learning_rate": 1.4553376906318084e-05,
"loss": 0.4435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44297829270362854,
"step": 335,
"valid_targets_mean": 4019.2,
"valid_targets_min": 610
},
{
"epoch": 0.2593440122044241,
"grad_norm": 0.5304240978755225,
"learning_rate": 1.4771241830065362e-05,
"loss": 0.4227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3744999170303345,
"step": 340,
"valid_targets_mean": 4157.5,
"valid_targets_min": 1035
},
{
"epoch": 0.2631578947368421,
"grad_norm": 0.669155831706647,
"learning_rate": 1.4989106753812636e-05,
"loss": 0.4595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4575551450252533,
"step": 345,
"valid_targets_mean": 5283.3,
"valid_targets_min": 1131
},
{
"epoch": 0.2669717772692601,
"grad_norm": 0.6703382325755647,
"learning_rate": 1.5206971677559914e-05,
"loss": 0.4406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4503791332244873,
"step": 350,
"valid_targets_mean": 3426.8,
"valid_targets_min": 1044
},
{
"epoch": 0.2707856598016781,
"grad_norm": 0.5788534308575273,
"learning_rate": 1.5424836601307192e-05,
"loss": 0.4515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43128445744514465,
"step": 355,
"valid_targets_mean": 4059.3,
"valid_targets_min": 385
},
{
"epoch": 0.2745995423340961,
"grad_norm": 0.5167153063531891,
"learning_rate": 1.5642701525054468e-05,
"loss": 0.438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4530758559703827,
"step": 360,
"valid_targets_mean": 4845.2,
"valid_targets_min": 978
},
{
"epoch": 0.2784134248665141,
"grad_norm": 0.5271031423011994,
"learning_rate": 1.5860566448801744e-05,
"loss": 0.4081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41743603348731995,
"step": 365,
"valid_targets_mean": 3877.2,
"valid_targets_min": 468
},
{
"epoch": 0.2822273073989321,
"grad_norm": 0.4584127185198121,
"learning_rate": 1.607843137254902e-05,
"loss": 0.4311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3872661590576172,
"step": 370,
"valid_targets_mean": 4894.0,
"valid_targets_min": 1049
},
{
"epoch": 0.28604118993135014,
"grad_norm": 0.5674756040704212,
"learning_rate": 1.6296296296296297e-05,
"loss": 0.4269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4131319522857666,
"step": 375,
"valid_targets_mean": 4604.5,
"valid_targets_min": 1024
},
{
"epoch": 0.2898550724637681,
"grad_norm": 0.49939284790297844,
"learning_rate": 1.6514161220043573e-05,
"loss": 0.413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4175918996334076,
"step": 380,
"valid_targets_mean": 4370.5,
"valid_targets_min": 1018
},
{
"epoch": 0.2936689549961861,
"grad_norm": 0.5308498919223146,
"learning_rate": 1.6732026143790852e-05,
"loss": 0.4101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41098570823669434,
"step": 385,
"valid_targets_mean": 3836.2,
"valid_targets_min": 336
},
{
"epoch": 0.2974828375286041,
"grad_norm": 0.5122991151701906,
"learning_rate": 1.6949891067538125e-05,
"loss": 0.4106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4084223508834839,
"step": 390,
"valid_targets_mean": 4162.0,
"valid_targets_min": 1472
},
{
"epoch": 0.3012967200610221,
"grad_norm": 0.5181967092269961,
"learning_rate": 1.7167755991285405e-05,
"loss": 0.4204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3865543305873871,
"step": 395,
"valid_targets_mean": 4125.0,
"valid_targets_min": 1314
},
{
"epoch": 0.30511060259344014,
"grad_norm": 0.5550861402134036,
"learning_rate": 1.738562091503268e-05,
"loss": 0.4397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4710928499698639,
"step": 400,
"valid_targets_mean": 4019.8,
"valid_targets_min": 1289
},
{
"epoch": 0.30892448512585813,
"grad_norm": 0.5438815034414402,
"learning_rate": 1.7603485838779957e-05,
"loss": 0.4228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3929981291294098,
"step": 405,
"valid_targets_mean": 4301.6,
"valid_targets_min": 504
},
{
"epoch": 0.3127383676582761,
"grad_norm": 0.6707002167342581,
"learning_rate": 1.7821350762527233e-05,
"loss": 0.4142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.422780841588974,
"step": 410,
"valid_targets_mean": 4865.9,
"valid_targets_min": 1739
},
{
"epoch": 0.3165522501906941,
"grad_norm": 2.032523055369547,
"learning_rate": 1.8039215686274513e-05,
"loss": 0.426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49667227268218994,
"step": 415,
"valid_targets_mean": 3822.7,
"valid_targets_min": 674
},
{
"epoch": 0.32036613272311215,
"grad_norm": 0.5997322470060125,
"learning_rate": 1.825708061002179e-05,
"loss": 0.406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4212714731693268,
"step": 420,
"valid_targets_mean": 3495.9,
"valid_targets_min": 274
},
{
"epoch": 0.32418001525553014,
"grad_norm": 0.48011386623091284,
"learning_rate": 1.8474945533769065e-05,
"loss": 0.405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3752917945384979,
"step": 425,
"valid_targets_mean": 4413.0,
"valid_targets_min": 1244
},
{
"epoch": 0.32799389778794813,
"grad_norm": 0.6028412606566115,
"learning_rate": 1.869281045751634e-05,
"loss": 0.4314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.46982622146606445,
"step": 430,
"valid_targets_mean": 4495.7,
"valid_targets_min": 919
},
{
"epoch": 0.3318077803203661,
"grad_norm": 0.5807673150953151,
"learning_rate": 1.8910675381263617e-05,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41810181736946106,
"step": 435,
"valid_targets_mean": 4100.7,
"valid_targets_min": 1543
},
{
"epoch": 0.3356216628527841,
"grad_norm": 0.5678000717779615,
"learning_rate": 1.9128540305010894e-05,
"loss": 0.4058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4434739351272583,
"step": 440,
"valid_targets_mean": 3935.1,
"valid_targets_min": 890
},
{
"epoch": 0.33943554538520215,
"grad_norm": 0.5469056120801911,
"learning_rate": 1.9346405228758173e-05,
"loss": 0.4116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37859591841697693,
"step": 445,
"valid_targets_mean": 3676.0,
"valid_targets_min": 1351
},
{
"epoch": 0.34324942791762014,
"grad_norm": 0.47827617322788585,
"learning_rate": 1.956427015250545e-05,
"loss": 0.4327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4103635847568512,
"step": 450,
"valid_targets_mean": 5130.5,
"valid_targets_min": 1279
},
{
"epoch": 0.34706331045003813,
"grad_norm": 0.6941453851155629,
"learning_rate": 1.9782135076252725e-05,
"loss": 0.4,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4146636724472046,
"step": 455,
"valid_targets_mean": 4593.5,
"valid_targets_min": 1281
},
{
"epoch": 0.3508771929824561,
"grad_norm": 0.5241578671868445,
"learning_rate": 2e-05,
"loss": 0.4178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4084761142730713,
"step": 460,
"valid_targets_mean": 4143.6,
"valid_targets_min": 1026
},
{
"epoch": 0.35469107551487417,
"grad_norm": 0.4946580310260773,
"learning_rate": 2.0217864923747278e-05,
"loss": 0.405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3879587948322296,
"step": 465,
"valid_targets_mean": 4280.2,
"valid_targets_min": 1094
},
{
"epoch": 0.35850495804729215,
"grad_norm": 0.5261377997096447,
"learning_rate": 2.0435729847494557e-05,
"loss": 0.4033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4153151512145996,
"step": 470,
"valid_targets_mean": 4111.7,
"valid_targets_min": 1306
},
{
"epoch": 0.36231884057971014,
"grad_norm": 0.49667981369723574,
"learning_rate": 2.0653594771241834e-05,
"loss": 0.4098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3661862313747406,
"step": 475,
"valid_targets_mean": 4103.8,
"valid_targets_min": 447
},
{
"epoch": 0.36613272311212813,
"grad_norm": 0.5674990532031673,
"learning_rate": 2.0871459694989106e-05,
"loss": 0.4,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42640629410743713,
"step": 480,
"valid_targets_mean": 3842.2,
"valid_targets_min": 395
},
{
"epoch": 0.3699466056445461,
"grad_norm": 0.49164681714558667,
"learning_rate": 2.1089324618736386e-05,
"loss": 0.3916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36857786774635315,
"step": 485,
"valid_targets_mean": 4493.4,
"valid_targets_min": 1671
},
{
"epoch": 0.37376048817696417,
"grad_norm": 1.1112103673444507,
"learning_rate": 2.1307189542483662e-05,
"loss": 0.4382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5883781313896179,
"step": 490,
"valid_targets_mean": 1448.0,
"valid_targets_min": 675
},
{
"epoch": 0.37757437070938216,
"grad_norm": 0.6359095779716393,
"learning_rate": 2.1525054466230938e-05,
"loss": 0.5499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4046311378479004,
"step": 495,
"valid_targets_mean": 4003.0,
"valid_targets_min": 1379
},
{
"epoch": 0.38138825324180015,
"grad_norm": 0.4982545028617011,
"learning_rate": 2.1742919389978218e-05,
"loss": 0.4297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4083602726459503,
"step": 500,
"valid_targets_mean": 4638.2,
"valid_targets_min": 1044
},
{
"epoch": 0.38520213577421814,
"grad_norm": 0.48915512583881143,
"learning_rate": 2.1960784313725494e-05,
"loss": 0.4163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41862890124320984,
"step": 505,
"valid_targets_mean": 4827.2,
"valid_targets_min": 416
},
{
"epoch": 0.3890160183066362,
"grad_norm": 0.517221047006931,
"learning_rate": 2.2178649237472767e-05,
"loss": 0.4107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4069397449493408,
"step": 510,
"valid_targets_mean": 4566.0,
"valid_targets_min": 1278
},
{
"epoch": 0.39282990083905417,
"grad_norm": 0.5121022744996065,
"learning_rate": 2.2396514161220043e-05,
"loss": 0.4108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43694543838500977,
"step": 515,
"valid_targets_mean": 5045.8,
"valid_targets_min": 1274
},
{
"epoch": 0.39664378337147216,
"grad_norm": 0.4800161727651644,
"learning_rate": 2.2614379084967322e-05,
"loss": 0.4098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.395797997713089,
"step": 520,
"valid_targets_mean": 4706.9,
"valid_targets_min": 1275
},
{
"epoch": 0.40045766590389015,
"grad_norm": 0.46860780726922296,
"learning_rate": 2.28322440087146e-05,
"loss": 0.4059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36623287200927734,
"step": 525,
"valid_targets_mean": 4559.0,
"valid_targets_min": 1282
},
{
"epoch": 0.40427154843630814,
"grad_norm": 0.5113105070608205,
"learning_rate": 2.3050108932461878e-05,
"loss": 0.3994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38678622245788574,
"step": 530,
"valid_targets_mean": 4872.2,
"valid_targets_min": 587
},
{
"epoch": 0.4080854309687262,
"grad_norm": 0.4842846017374961,
"learning_rate": 2.3267973856209154e-05,
"loss": 0.3985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4049014747142792,
"step": 535,
"valid_targets_mean": 5120.1,
"valid_targets_min": 531
},
{
"epoch": 0.41189931350114417,
"grad_norm": 0.48187699542171236,
"learning_rate": 2.3485838779956427e-05,
"loss": 0.4151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42579174041748047,
"step": 540,
"valid_targets_mean": 5236.5,
"valid_targets_min": 1493
},
{
"epoch": 0.41571319603356216,
"grad_norm": 0.5069904951791335,
"learning_rate": 2.3703703703703703e-05,
"loss": 0.3864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.351409912109375,
"step": 545,
"valid_targets_mean": 4193.8,
"valid_targets_min": 1929
},
{
"epoch": 0.41952707856598015,
"grad_norm": 0.47887731304957243,
"learning_rate": 2.3921568627450983e-05,
"loss": 0.3962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3922696113586426,
"step": 550,
"valid_targets_mean": 4655.1,
"valid_targets_min": 1354
},
{
"epoch": 0.4233409610983982,
"grad_norm": 0.4564867344774318,
"learning_rate": 2.413943355119826e-05,
"loss": 0.4237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3802224397659302,
"step": 555,
"valid_targets_mean": 5557.0,
"valid_targets_min": 1151
},
{
"epoch": 0.4271548436308162,
"grad_norm": 0.5031199121109118,
"learning_rate": 2.4357298474945535e-05,
"loss": 0.3761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33998584747314453,
"step": 560,
"valid_targets_mean": 4495.2,
"valid_targets_min": 999
},
{
"epoch": 0.4309687261632342,
"grad_norm": 0.4928451295329029,
"learning_rate": 2.4575163398692815e-05,
"loss": 0.415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4243813753128052,
"step": 565,
"valid_targets_mean": 4882.1,
"valid_targets_min": 987
},
{
"epoch": 0.43478260869565216,
"grad_norm": 0.5259224766412115,
"learning_rate": 2.479302832244009e-05,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3836231231689453,
"step": 570,
"valid_targets_mean": 4713.7,
"valid_targets_min": 1686
},
{
"epoch": 0.43859649122807015,
"grad_norm": 0.5579901905077622,
"learning_rate": 2.5010893246187364e-05,
"loss": 0.3776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3920012414455414,
"step": 575,
"valid_targets_mean": 3984.4,
"valid_targets_min": 977
},
{
"epoch": 0.4424103737604882,
"grad_norm": 0.5439800495512314,
"learning_rate": 2.5228758169934643e-05,
"loss": 0.37,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33532944321632385,
"step": 580,
"valid_targets_mean": 3737.5,
"valid_targets_min": 354
},
{
"epoch": 0.4462242562929062,
"grad_norm": 0.5662975384921443,
"learning_rate": 2.544662309368192e-05,
"loss": 0.4096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4044320285320282,
"step": 585,
"valid_targets_mean": 3571.9,
"valid_targets_min": 1005
},
{
"epoch": 0.4500381388253242,
"grad_norm": 0.47734947502220565,
"learning_rate": 2.5664488017429196e-05,
"loss": 0.3913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41730186343193054,
"step": 590,
"valid_targets_mean": 5255.7,
"valid_targets_min": 750
},
{
"epoch": 0.45385202135774216,
"grad_norm": 0.46089066500843384,
"learning_rate": 2.5882352941176475e-05,
"loss": 0.3849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35630854964256287,
"step": 595,
"valid_targets_mean": 4318.8,
"valid_targets_min": 1350
},
{
"epoch": 0.4576659038901602,
"grad_norm": 0.533942025808671,
"learning_rate": 2.610021786492375e-05,
"loss": 0.3949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39351949095726013,
"step": 600,
"valid_targets_mean": 4463.6,
"valid_targets_min": 1353
},
{
"epoch": 0.4614797864225782,
"grad_norm": 0.620788552352078,
"learning_rate": 2.6318082788671024e-05,
"loss": 0.3986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4100879430770874,
"step": 605,
"valid_targets_mean": 4238.0,
"valid_targets_min": 495
},
{
"epoch": 0.4652936689549962,
"grad_norm": 0.47098349815571094,
"learning_rate": 2.65359477124183e-05,
"loss": 0.417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4212774932384491,
"step": 610,
"valid_targets_mean": 5455.1,
"valid_targets_min": 1228
},
{
"epoch": 0.4691075514874142,
"grad_norm": 0.531495026436975,
"learning_rate": 2.675381263616558e-05,
"loss": 0.4189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41660937666893005,
"step": 615,
"valid_targets_mean": 4546.2,
"valid_targets_min": 1467
},
{
"epoch": 0.47292143401983217,
"grad_norm": 0.49774084718519146,
"learning_rate": 2.6971677559912856e-05,
"loss": 0.3939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3917350471019745,
"step": 620,
"valid_targets_mean": 4665.4,
"valid_targets_min": 1231
},
{
"epoch": 0.4767353165522502,
"grad_norm": 0.5223030282822787,
"learning_rate": 2.7189542483660135e-05,
"loss": 0.4062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4286997318267822,
"step": 625,
"valid_targets_mean": 4919.1,
"valid_targets_min": 401
},
{
"epoch": 0.4805491990846682,
"grad_norm": 0.6311171808018544,
"learning_rate": 2.740740740740741e-05,
"loss": 0.4148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4223945140838623,
"step": 630,
"valid_targets_mean": 3921.5,
"valid_targets_min": 807
},
{
"epoch": 0.4843630816170862,
"grad_norm": 0.5423403261529165,
"learning_rate": 2.7625272331154684e-05,
"loss": 0.3855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3739047944545746,
"step": 635,
"valid_targets_mean": 3978.4,
"valid_targets_min": 715
},
{
"epoch": 0.4881769641495042,
"grad_norm": 0.5833531419739164,
"learning_rate": 2.784313725490196e-05,
"loss": 0.3851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3918963372707367,
"step": 640,
"valid_targets_mean": 3173.8,
"valid_targets_min": 933
},
{
"epoch": 0.4919908466819222,
"grad_norm": 0.5888665746157846,
"learning_rate": 2.806100217864924e-05,
"loss": 0.4044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40655291080474854,
"step": 645,
"valid_targets_mean": 4044.9,
"valid_targets_min": 1272
},
{
"epoch": 0.4958047292143402,
"grad_norm": 0.6310048168490392,
"learning_rate": 2.8278867102396516e-05,
"loss": 0.3894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40415921807289124,
"step": 650,
"valid_targets_mean": 3122.2,
"valid_targets_min": 457
},
{
"epoch": 0.4996186117467582,
"grad_norm": 0.7447980014403361,
"learning_rate": 2.8496732026143792e-05,
"loss": 0.677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44158491492271423,
"step": 655,
"valid_targets_mean": 2758.2,
"valid_targets_min": 574
},
{
"epoch": 0.5034324942791762,
"grad_norm": 0.5141237643896464,
"learning_rate": 2.8714596949891072e-05,
"loss": 0.3874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4077136516571045,
"step": 660,
"valid_targets_mean": 4658.0,
"valid_targets_min": 1364
},
{
"epoch": 0.5072463768115942,
"grad_norm": 0.6083519366022135,
"learning_rate": 2.8932461873638345e-05,
"loss": 0.3797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3819454610347748,
"step": 665,
"valid_targets_mean": 4113.9,
"valid_targets_min": 815
},
{
"epoch": 0.5110602593440122,
"grad_norm": 0.5293654642242984,
"learning_rate": 2.915032679738562e-05,
"loss": 0.4086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35915103554725647,
"step": 670,
"valid_targets_mean": 4441.2,
"valid_targets_min": 1100
},
{
"epoch": 0.5148741418764302,
"grad_norm": 0.49950432251413246,
"learning_rate": 2.93681917211329e-05,
"loss": 0.3727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37206077575683594,
"step": 675,
"valid_targets_mean": 4198.2,
"valid_targets_min": 967
},
{
"epoch": 0.5186880244088482,
"grad_norm": 0.4630265565067862,
"learning_rate": 2.9586056644880177e-05,
"loss": 0.39,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.385885089635849,
"step": 680,
"valid_targets_mean": 5195.9,
"valid_targets_min": 1113
},
{
"epoch": 0.5225019069412662,
"grad_norm": 0.5299093503446665,
"learning_rate": 2.9803921568627453e-05,
"loss": 0.4099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4257817566394806,
"step": 685,
"valid_targets_mean": 3791.5,
"valid_targets_min": 1313
},
{
"epoch": 0.5263157894736842,
"grad_norm": 0.5647217389609704,
"learning_rate": 3.0021786492374732e-05,
"loss": 0.3934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4137308895587921,
"step": 690,
"valid_targets_mean": 3960.7,
"valid_targets_min": 844
},
{
"epoch": 0.5301296720061022,
"grad_norm": 0.5278358373812087,
"learning_rate": 3.023965141612201e-05,
"loss": 0.3888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4036301076412201,
"step": 695,
"valid_targets_mean": 4288.9,
"valid_targets_min": 1040
},
{
"epoch": 0.5339435545385202,
"grad_norm": 0.5073909224886175,
"learning_rate": 3.045751633986928e-05,
"loss": 0.3906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3536445200443268,
"step": 700,
"valid_targets_mean": 3966.4,
"valid_targets_min": 1084
},
{
"epoch": 0.5377574370709383,
"grad_norm": 0.4830058432421143,
"learning_rate": 3.067538126361656e-05,
"loss": 0.388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4126201868057251,
"step": 705,
"valid_targets_mean": 5077.2,
"valid_targets_min": 1141
},
{
"epoch": 0.5415713196033562,
"grad_norm": 0.47042770960997,
"learning_rate": 3.0893246187363834e-05,
"loss": 0.3825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3704334497451782,
"step": 710,
"valid_targets_mean": 4411.2,
"valid_targets_min": 1106
},
{
"epoch": 0.5453852021357742,
"grad_norm": 0.5497176981288221,
"learning_rate": 3.111111111111112e-05,
"loss": 0.3917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3955814838409424,
"step": 715,
"valid_targets_mean": 4098.8,
"valid_targets_min": 881
},
{
"epoch": 0.5491990846681922,
"grad_norm": 0.5024335146851029,
"learning_rate": 3.132897603485839e-05,
"loss": 0.4255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4101240634918213,
"step": 720,
"valid_targets_mean": 4925.6,
"valid_targets_min": 1056
},
{
"epoch": 0.5530129672006102,
"grad_norm": 0.5231997517163126,
"learning_rate": 3.154684095860567e-05,
"loss": 0.3913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4119824469089508,
"step": 725,
"valid_targets_mean": 4464.0,
"valid_targets_min": 1397
},
{
"epoch": 0.5568268497330282,
"grad_norm": 0.5711284191765268,
"learning_rate": 3.1764705882352945e-05,
"loss": 0.3777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3848339319229126,
"step": 730,
"valid_targets_mean": 3427.6,
"valid_targets_min": 850
},
{
"epoch": 0.5606407322654462,
"grad_norm": 0.5389152963467714,
"learning_rate": 3.198257080610022e-05,
"loss": 0.3996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3863255977630615,
"step": 735,
"valid_targets_mean": 3456.2,
"valid_targets_min": 928
},
{
"epoch": 0.5644546147978642,
"grad_norm": 0.49151065077688183,
"learning_rate": 3.22004357298475e-05,
"loss": 0.408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3926849365234375,
"step": 740,
"valid_targets_mean": 4422.6,
"valid_targets_min": 1164
},
{
"epoch": 0.5682684973302822,
"grad_norm": 0.4856172845776493,
"learning_rate": 3.2418300653594774e-05,
"loss": 0.3676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4255011975765228,
"step": 745,
"valid_targets_mean": 5380.8,
"valid_targets_min": 1094
},
{
"epoch": 0.5720823798627003,
"grad_norm": 0.4676240103796647,
"learning_rate": 3.263616557734205e-05,
"loss": 0.3912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36335039138793945,
"step": 750,
"valid_targets_mean": 5003.5,
"valid_targets_min": 1181
},
{
"epoch": 0.5758962623951183,
"grad_norm": 0.6001473921317693,
"learning_rate": 3.2854030501089326e-05,
"loss": 0.4009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4211665689945221,
"step": 755,
"valid_targets_mean": 3523.4,
"valid_targets_min": 652
},
{
"epoch": 0.5797101449275363,
"grad_norm": 0.4595865924313308,
"learning_rate": 3.30718954248366e-05,
"loss": 0.3937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38674649596214294,
"step": 760,
"valid_targets_mean": 4933.9,
"valid_targets_min": 887
},
{
"epoch": 0.5835240274599542,
"grad_norm": 0.5168951363868316,
"learning_rate": 3.328976034858388e-05,
"loss": 0.3983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42586424946784973,
"step": 765,
"valid_targets_mean": 3924.8,
"valid_targets_min": 909
},
{
"epoch": 0.5873379099923722,
"grad_norm": 0.4723825484517219,
"learning_rate": 3.3507625272331155e-05,
"loss": 0.3924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.365474134683609,
"step": 770,
"valid_targets_mean": 4569.1,
"valid_targets_min": 1411
},
{
"epoch": 0.5911517925247902,
"grad_norm": 0.4771358236427614,
"learning_rate": 3.372549019607844e-05,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36031606793403625,
"step": 775,
"valid_targets_mean": 4408.3,
"valid_targets_min": 1060
},
{
"epoch": 0.5949656750572082,
"grad_norm": 0.5880545694161227,
"learning_rate": 3.3943355119825714e-05,
"loss": 0.39,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3750080168247223,
"step": 780,
"valid_targets_mean": 3936.3,
"valid_targets_min": 1230
},
{
"epoch": 0.5987795575896262,
"grad_norm": 0.489467269189964,
"learning_rate": 3.416122004357299e-05,
"loss": 0.3692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36050716042518616,
"step": 785,
"valid_targets_mean": 4176.9,
"valid_targets_min": 306
},
{
"epoch": 0.6025934401220442,
"grad_norm": 0.5536794566949234,
"learning_rate": 3.4379084967320266e-05,
"loss": 0.3925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35600319504737854,
"step": 790,
"valid_targets_mean": 3812.0,
"valid_targets_min": 917
},
{
"epoch": 0.6064073226544623,
"grad_norm": 0.4902508002712552,
"learning_rate": 3.459694989106754e-05,
"loss": 0.3599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34459996223449707,
"step": 795,
"valid_targets_mean": 4373.7,
"valid_targets_min": 991
},
{
"epoch": 0.6102212051868803,
"grad_norm": 0.4998517004871938,
"learning_rate": 3.481481481481482e-05,
"loss": 0.3935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.411490797996521,
"step": 800,
"valid_targets_mean": 5246.0,
"valid_targets_min": 927
},
{
"epoch": 0.6140350877192983,
"grad_norm": 0.47895938853802045,
"learning_rate": 3.5032679738562094e-05,
"loss": 0.3771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38547301292419434,
"step": 805,
"valid_targets_mean": 5198.0,
"valid_targets_min": 1305
},
{
"epoch": 0.6178489702517163,
"grad_norm": 0.5004860108698085,
"learning_rate": 3.525054466230937e-05,
"loss": 0.3687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3470894396305084,
"step": 810,
"valid_targets_mean": 3868.3,
"valid_targets_min": 840
},
{
"epoch": 0.6216628527841342,
"grad_norm": 0.5060663282767479,
"learning_rate": 3.546840958605665e-05,
"loss": 0.4047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39354002475738525,
"step": 815,
"valid_targets_mean": 4378.5,
"valid_targets_min": 1324
},
{
"epoch": 0.6254767353165522,
"grad_norm": 1.6522740852946434,
"learning_rate": 3.568627450980393e-05,
"loss": 0.6681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7057502865791321,
"step": 820,
"valid_targets_mean": 834.8,
"valid_targets_min": 622
},
{
"epoch": 0.6292906178489702,
"grad_norm": 0.5115480729000605,
"learning_rate": 3.59041394335512e-05,
"loss": 0.3951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3566841185092926,
"step": 825,
"valid_targets_mean": 4504.2,
"valid_targets_min": 356
},
{
"epoch": 0.6331045003813882,
"grad_norm": 0.5430480146137391,
"learning_rate": 3.6122004357298475e-05,
"loss": 0.382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38058558106422424,
"step": 830,
"valid_targets_mean": 4257.1,
"valid_targets_min": 1598
},
{
"epoch": 0.6369183829138062,
"grad_norm": 0.540378079231876,
"learning_rate": 3.633986928104575e-05,
"loss": 0.3767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35072061419487,
"step": 835,
"valid_targets_mean": 4133.5,
"valid_targets_min": 1372
},
{
"epoch": 0.6407322654462243,
"grad_norm": 0.5004544935516848,
"learning_rate": 3.6557734204793034e-05,
"loss": 0.3726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33233800530433655,
"step": 840,
"valid_targets_mean": 4052.1,
"valid_targets_min": 657
},
{
"epoch": 0.6445461479786423,
"grad_norm": 0.5183298816243558,
"learning_rate": 3.677559912854031e-05,
"loss": 0.3633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4036792814731598,
"step": 845,
"valid_targets_mean": 4681.9,
"valid_targets_min": 946
},
{
"epoch": 0.6483600305110603,
"grad_norm": 0.4847317504698284,
"learning_rate": 3.699346405228759e-05,
"loss": 0.4001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40551283955574036,
"step": 850,
"valid_targets_mean": 5111.8,
"valid_targets_min": 1202
},
{
"epoch": 0.6521739130434783,
"grad_norm": 0.4932653055447772,
"learning_rate": 3.7211328976034856e-05,
"loss": 0.4006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4025735855102539,
"step": 855,
"valid_targets_mean": 5248.5,
"valid_targets_min": 1118
},
{
"epoch": 0.6559877955758963,
"grad_norm": 0.47245011161392636,
"learning_rate": 3.742919389978214e-05,
"loss": 0.3887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3714592754840851,
"step": 860,
"valid_targets_mean": 4735.7,
"valid_targets_min": 1169
},
{
"epoch": 0.6598016781083142,
"grad_norm": 0.48874913799650793,
"learning_rate": 3.7647058823529415e-05,
"loss": 0.365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35503053665161133,
"step": 865,
"valid_targets_mean": 4341.5,
"valid_targets_min": 514
},
{
"epoch": 0.6636155606407322,
"grad_norm": 0.4993317096416843,
"learning_rate": 3.786492374727669e-05,
"loss": 0.3727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3757993280887604,
"step": 870,
"valid_targets_mean": 4060.4,
"valid_targets_min": 793
},
{
"epoch": 0.6674294431731502,
"grad_norm": 0.5080718314678389,
"learning_rate": 3.808278867102397e-05,
"loss": 0.3799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35796621441841125,
"step": 875,
"valid_targets_mean": 4294.8,
"valid_targets_min": 943
},
{
"epoch": 0.6712433257055682,
"grad_norm": 0.5139513225612712,
"learning_rate": 3.8300653594771244e-05,
"loss": 0.3826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40277424454689026,
"step": 880,
"valid_targets_mean": 4046.4,
"valid_targets_min": 1159
},
{
"epoch": 0.6750572082379863,
"grad_norm": 0.4825425455442106,
"learning_rate": 3.851851851851852e-05,
"loss": 0.3807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3549913465976715,
"step": 885,
"valid_targets_mean": 4678.9,
"valid_targets_min": 1080
},
{
"epoch": 0.6788710907704043,
"grad_norm": 0.46169037581763467,
"learning_rate": 3.8736383442265796e-05,
"loss": 0.3582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3371763229370117,
"step": 890,
"valid_targets_mean": 4274.1,
"valid_targets_min": 1006
},
{
"epoch": 0.6826849733028223,
"grad_norm": 0.5736539263411012,
"learning_rate": 3.895424836601307e-05,
"loss": 0.3746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3682954013347626,
"step": 895,
"valid_targets_mean": 3701.7,
"valid_targets_min": 1264
},
{
"epoch": 0.6864988558352403,
"grad_norm": 0.4573138967748284,
"learning_rate": 3.917211328976035e-05,
"loss": 0.3517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3203882873058319,
"step": 900,
"valid_targets_mean": 5214.0,
"valid_targets_min": 1596
},
{
"epoch": 0.6903127383676583,
"grad_norm": 0.5220685316176321,
"learning_rate": 3.938997821350763e-05,
"loss": 0.3892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.398406982421875,
"step": 905,
"valid_targets_mean": 3611.3,
"valid_targets_min": 906
},
{
"epoch": 0.6941266209000763,
"grad_norm": 0.578745321361813,
"learning_rate": 3.960784313725491e-05,
"loss": 0.3721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.368577241897583,
"step": 910,
"valid_targets_mean": 3772.9,
"valid_targets_min": 431
},
{
"epoch": 0.6979405034324943,
"grad_norm": 0.47869296323020866,
"learning_rate": 3.9825708061002184e-05,
"loss": 0.3771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3765166699886322,
"step": 915,
"valid_targets_mean": 4115.8,
"valid_targets_min": 843
},
{
"epoch": 0.7017543859649122,
"grad_norm": 0.4290499852367467,
"learning_rate": 3.9999998553079044e-05,
"loss": 0.3726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34164825081825256,
"step": 920,
"valid_targets_mean": 4980.8,
"valid_targets_min": 2055
},
{
"epoch": 0.7055682684973302,
"grad_norm": 0.4827158139422963,
"learning_rate": 3.9999947910867415e-05,
"loss": 0.3806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4111228287220001,
"step": 925,
"valid_targets_mean": 5021.9,
"valid_targets_min": 1334
},
{
"epoch": 0.7093821510297483,
"grad_norm": 0.565668431178144,
"learning_rate": 3.9999824922817136e-05,
"loss": 0.3899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3945969343185425,
"step": 930,
"valid_targets_mean": 3504.0,
"valid_targets_min": 994
},
{
"epoch": 0.7131960335621663,
"grad_norm": 0.5207733100448804,
"learning_rate": 3.999962958937309e-05,
"loss": 0.3706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3764989674091339,
"step": 935,
"valid_targets_mean": 4280.6,
"valid_targets_min": 1070
},
{
"epoch": 0.7170099160945843,
"grad_norm": 0.4961113556289845,
"learning_rate": 3.999936191124184e-05,
"loss": 0.3751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40078458189964294,
"step": 940,
"valid_targets_mean": 4046.6,
"valid_targets_min": 1336
},
{
"epoch": 0.7208237986270023,
"grad_norm": 0.5462231749803261,
"learning_rate": 3.999902188939168e-05,
"loss": 0.3784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38428983092308044,
"step": 945,
"valid_targets_mean": 4143.9,
"valid_targets_min": 859
},
{
"epoch": 0.7246376811594203,
"grad_norm": 0.4504728537471523,
"learning_rate": 3.999860952505256e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38030561804771423,
"step": 950,
"valid_targets_mean": 5215.9,
"valid_targets_min": 1424
},
{
"epoch": 0.7284515636918383,
"grad_norm": 0.46112814246368733,
"learning_rate": 3.999812481971613e-05,
"loss": 0.3626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35764268040657043,
"step": 955,
"valid_targets_mean": 4956.2,
"valid_targets_min": 1100
},
{
"epoch": 0.7322654462242563,
"grad_norm": 0.5093811115162794,
"learning_rate": 3.999756777513573e-05,
"loss": 0.3814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38869643211364746,
"step": 960,
"valid_targets_mean": 4663.0,
"valid_targets_min": 1162
},
{
"epoch": 0.7360793287566743,
"grad_norm": 0.5166363577249488,
"learning_rate": 3.999693839332633e-05,
"loss": 0.3706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.345225065946579,
"step": 965,
"valid_targets_mean": 4345.2,
"valid_targets_min": 1173
},
{
"epoch": 0.7398932112890922,
"grad_norm": 0.43456501611751824,
"learning_rate": 3.9996236676564606e-05,
"loss": 0.3893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3924640715122223,
"step": 970,
"valid_targets_mean": 5048.5,
"valid_targets_min": 467
},
{
"epoch": 0.7437070938215103,
"grad_norm": 0.4528833919025705,
"learning_rate": 3.9995462627388884e-05,
"loss": 0.3808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3907564878463745,
"step": 975,
"valid_targets_mean": 5262.2,
"valid_targets_min": 1557
},
{
"epoch": 0.7475209763539283,
"grad_norm": 0.44803105770779067,
"learning_rate": 3.999461624859913e-05,
"loss": 0.3779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3801683187484741,
"step": 980,
"valid_targets_mean": 5022.8,
"valid_targets_min": 1333
},
{
"epoch": 0.7513348588863463,
"grad_norm": 1.3945522001589343,
"learning_rate": 3.999369754325694e-05,
"loss": 0.5941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7252269387245178,
"step": 985,
"valid_targets_mean": 882.6,
"valid_targets_min": 583
},
{
"epoch": 0.7551487414187643,
"grad_norm": 0.4459691668091537,
"learning_rate": 3.999270651468557e-05,
"loss": 0.3752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3678567707538605,
"step": 990,
"valid_targets_mean": 4537.0,
"valid_targets_min": 843
},
{
"epoch": 0.7589626239511823,
"grad_norm": 0.6787380715262016,
"learning_rate": 3.999164316646985e-05,
"loss": 0.3809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43198099732398987,
"step": 995,
"valid_targets_mean": 4426.8,
"valid_targets_min": 1103
},
{
"epoch": 0.7627765064836003,
"grad_norm": 0.5234474839142296,
"learning_rate": 3.999050750245624e-05,
"loss": 0.3541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3377021253108978,
"step": 1000,
"valid_targets_mean": 3565.2,
"valid_targets_min": 1013
},
{
"epoch": 0.7665903890160183,
"grad_norm": 0.4701290801073301,
"learning_rate": 3.998929952675278e-05,
"loss": 0.3944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39100274443626404,
"step": 1005,
"valid_targets_mean": 5459.8,
"valid_targets_min": 1291
},
{
"epoch": 0.7704042715484363,
"grad_norm": 0.4887301565086132,
"learning_rate": 3.998801924372908e-05,
"loss": 0.3898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41781285405158997,
"step": 1010,
"valid_targets_mean": 4056.2,
"valid_targets_min": 1102
},
{
"epoch": 0.7742181540808543,
"grad_norm": 0.46737377548754167,
"learning_rate": 3.99866666580163e-05,
"loss": 0.3463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3446056842803955,
"step": 1015,
"valid_targets_mean": 4130.0,
"valid_targets_min": 327
},
{
"epoch": 0.7780320366132724,
"grad_norm": 0.47600381282403187,
"learning_rate": 3.9985241774507164e-05,
"loss": 0.3785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3605664074420929,
"step": 1020,
"valid_targets_mean": 4542.7,
"valid_targets_min": 1212
},
{
"epoch": 0.7818459191456903,
"grad_norm": 0.4522050546091532,
"learning_rate": 3.998374459835591e-05,
"loss": 0.3638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36169174313545227,
"step": 1025,
"valid_targets_mean": 4604.6,
"valid_targets_min": 420
},
{
"epoch": 0.7856598016781083,
"grad_norm": 0.49172411587001463,
"learning_rate": 3.998217513497825e-05,
"loss": 0.3635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3846949636936188,
"step": 1030,
"valid_targets_mean": 4501.2,
"valid_targets_min": 1410
},
{
"epoch": 0.7894736842105263,
"grad_norm": 0.441370684061777,
"learning_rate": 3.998053339005142e-05,
"loss": 0.3515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33769798278808594,
"step": 1035,
"valid_targets_mean": 4676.2,
"valid_targets_min": 577
},
{
"epoch": 0.7932875667429443,
"grad_norm": 0.5082455341543946,
"learning_rate": 3.9978819369514115e-05,
"loss": 0.3569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3954106569290161,
"step": 1040,
"valid_targets_mean": 3732.4,
"valid_targets_min": 1297
},
{
"epoch": 0.7971014492753623,
"grad_norm": 0.5239126884155341,
"learning_rate": 3.997703307956646e-05,
"loss": 0.3704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37683117389678955,
"step": 1045,
"valid_targets_mean": 4162.2,
"valid_targets_min": 929
},
{
"epoch": 0.8009153318077803,
"grad_norm": 0.45893851228954163,
"learning_rate": 3.9975174526669994e-05,
"loss": 0.373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3459120988845825,
"step": 1050,
"valid_targets_mean": 4355.8,
"valid_targets_min": 1475
},
{
"epoch": 0.8047292143401983,
"grad_norm": 0.5054974279416519,
"learning_rate": 3.997324371754767e-05,
"loss": 0.345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38253259658813477,
"step": 1055,
"valid_targets_mean": 4271.6,
"valid_targets_min": 877
},
{
"epoch": 0.8085430968726163,
"grad_norm": 0.5185372806749117,
"learning_rate": 3.9971240659183805e-05,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4232671558856964,
"step": 1060,
"valid_targets_mean": 4016.3,
"valid_targets_min": 1584
},
{
"epoch": 0.8123569794050344,
"grad_norm": 0.5512258043463327,
"learning_rate": 3.996916535882407e-05,
"loss": 0.3762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41251853108406067,
"step": 1065,
"valid_targets_mean": 3834.4,
"valid_targets_min": 963
},
{
"epoch": 0.8161708619374524,
"grad_norm": 0.49799468322654605,
"learning_rate": 3.996701782397544e-05,
"loss": 0.3474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3488624393939972,
"step": 1070,
"valid_targets_mean": 4394.7,
"valid_targets_min": 971
},
{
"epoch": 0.8199847444698704,
"grad_norm": 0.4404711299084823,
"learning_rate": 3.9964798062406205e-05,
"loss": 0.3581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3426206409931183,
"step": 1075,
"valid_targets_mean": 5370.3,
"valid_targets_min": 930
},
{
"epoch": 0.8237986270022883,
"grad_norm": 0.4720172689171758,
"learning_rate": 3.996250608214591e-05,
"loss": 0.3559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35691210627555847,
"step": 1080,
"valid_targets_mean": 4801.6,
"valid_targets_min": 1460
},
{
"epoch": 0.8276125095347063,
"grad_norm": 0.5500897649466603,
"learning_rate": 3.996014189148534e-05,
"loss": 0.3842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39323708415031433,
"step": 1085,
"valid_targets_mean": 3530.9,
"valid_targets_min": 516
},
{
"epoch": 0.8314263920671243,
"grad_norm": 0.5199194226587828,
"learning_rate": 3.995770549897648e-05,
"loss": 0.3816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38213369250297546,
"step": 1090,
"valid_targets_mean": 5115.5,
"valid_targets_min": 1055
},
{
"epoch": 0.8352402745995423,
"grad_norm": 0.762344226599133,
"learning_rate": 3.9955196913432506e-05,
"loss": 0.3641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3407316207885742,
"step": 1095,
"valid_targets_mean": 4745.6,
"valid_targets_min": 1724
},
{
"epoch": 0.8390541571319603,
"grad_norm": 0.4767081980686291,
"learning_rate": 3.995261614392771e-05,
"loss": 0.3519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3628446161746979,
"step": 1100,
"valid_targets_mean": 4455.9,
"valid_targets_min": 1123
},
{
"epoch": 0.8428680396643783,
"grad_norm": 0.4603493033632945,
"learning_rate": 3.994996319979753e-05,
"loss": 0.3847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37550342082977295,
"step": 1105,
"valid_targets_mean": 4831.5,
"valid_targets_min": 1362
},
{
"epoch": 0.8466819221967964,
"grad_norm": 0.4321868829723287,
"learning_rate": 3.9947238090638455e-05,
"loss": 0.347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32966333627700806,
"step": 1110,
"valid_targets_mean": 5257.2,
"valid_targets_min": 2401
},
{
"epoch": 0.8504958047292144,
"grad_norm": 0.4928212125106336,
"learning_rate": 3.994444082630803e-05,
"loss": 0.3718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40663325786590576,
"step": 1115,
"valid_targets_mean": 4272.6,
"valid_targets_min": 1201
},
{
"epoch": 0.8543096872616324,
"grad_norm": 0.5369422324647564,
"learning_rate": 3.99415714169248e-05,
"loss": 0.3744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38518229126930237,
"step": 1120,
"valid_targets_mean": 4210.9,
"valid_targets_min": 1195
},
{
"epoch": 0.8581235697940504,
"grad_norm": 0.531536440074966,
"learning_rate": 3.993862987286829e-05,
"loss": 0.3624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34791314601898193,
"step": 1125,
"valid_targets_mean": 4195.2,
"valid_targets_min": 908
},
{
"epoch": 0.8619374523264683,
"grad_norm": 0.5120386360242026,
"learning_rate": 3.993561620477894e-05,
"loss": 0.3939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4098881781101227,
"step": 1130,
"valid_targets_mean": 4433.9,
"valid_targets_min": 861
},
{
"epoch": 0.8657513348588863,
"grad_norm": 0.5546229292064857,
"learning_rate": 3.993253042355811e-05,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38434138894081116,
"step": 1135,
"valid_targets_mean": 4411.3,
"valid_targets_min": 1015
},
{
"epoch": 0.8695652173913043,
"grad_norm": 0.4847205687071689,
"learning_rate": 3.992937254036798e-05,
"loss": 0.3689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35996517539024353,
"step": 1140,
"valid_targets_mean": 4372.5,
"valid_targets_min": 730
},
{
"epoch": 0.8733790999237223,
"grad_norm": 0.496578789451106,
"learning_rate": 3.992614256663159e-05,
"loss": 0.3809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38061416149139404,
"step": 1145,
"valid_targets_mean": 3699.5,
"valid_targets_min": 1064
},
{
"epoch": 0.8771929824561403,
"grad_norm": 1.3174959384842835,
"learning_rate": 3.992284051403272e-05,
"loss": 0.6232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7174744009971619,
"step": 1150,
"valid_targets_mean": 924.8,
"valid_targets_min": 595
},
{
"epoch": 0.8810068649885584,
"grad_norm": 0.5184996714136828,
"learning_rate": 3.991946639451588e-05,
"loss": 0.3731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36945977807044983,
"step": 1155,
"valid_targets_mean": 3840.2,
"valid_targets_min": 1092
},
{
"epoch": 0.8848207475209764,
"grad_norm": 0.5374317618484389,
"learning_rate": 3.991602022028628e-05,
"loss": 0.3579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3723803460597992,
"step": 1160,
"valid_targets_mean": 4231.3,
"valid_targets_min": 427
},
{
"epoch": 0.8886346300533944,
"grad_norm": 0.44966249003897346,
"learning_rate": 3.991250200380978e-05,
"loss": 0.3575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32036292552948,
"step": 1165,
"valid_targets_mean": 4182.4,
"valid_targets_min": 1484
},
{
"epoch": 0.8924485125858124,
"grad_norm": 0.4823324463114382,
"learning_rate": 3.9908911757812816e-05,
"loss": 0.3684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.328177809715271,
"step": 1170,
"valid_targets_mean": 3529.1,
"valid_targets_min": 437
},
{
"epoch": 0.8962623951182304,
"grad_norm": 0.4552734443679323,
"learning_rate": 3.99052494952824e-05,
"loss": 0.3835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3691507875919342,
"step": 1175,
"valid_targets_mean": 4576.7,
"valid_targets_min": 530
},
{
"epoch": 0.9000762776506483,
"grad_norm": 0.48871644633752215,
"learning_rate": 3.9901515229466035e-05,
"loss": 0.357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3446696698665619,
"step": 1180,
"valid_targets_mean": 3823.9,
"valid_targets_min": 1160
},
{
"epoch": 0.9038901601830663,
"grad_norm": 0.49070083319956265,
"learning_rate": 3.98977089738717e-05,
"loss": 0.3807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41360974311828613,
"step": 1185,
"valid_targets_mean": 4416.5,
"valid_targets_min": 705
},
{
"epoch": 0.9077040427154843,
"grad_norm": 0.5313518804759381,
"learning_rate": 3.9893830742267734e-05,
"loss": 0.3682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38949641585350037,
"step": 1190,
"valid_targets_mean": 6101.7,
"valid_targets_min": 894
},
{
"epoch": 0.9115179252479023,
"grad_norm": 0.4604256113230519,
"learning_rate": 3.9889880548682896e-05,
"loss": 0.3696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38642418384552,
"step": 1195,
"valid_targets_mean": 4514.3,
"valid_targets_min": 1035
},
{
"epoch": 0.9153318077803204,
"grad_norm": 0.47292655188438054,
"learning_rate": 3.988585840740623e-05,
"loss": 0.3735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37636706233024597,
"step": 1200,
"valid_targets_mean": 4110.0,
"valid_targets_min": 442
},
{
"epoch": 0.9191456903127384,
"grad_norm": 0.43282070896702063,
"learning_rate": 3.988176433298701e-05,
"loss": 0.3703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38640037178993225,
"step": 1205,
"valid_targets_mean": 5378.8,
"valid_targets_min": 1510
},
{
"epoch": 0.9229595728451564,
"grad_norm": 0.5020061109814692,
"learning_rate": 3.987759834023477e-05,
"loss": 0.3581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.363527774810791,
"step": 1210,
"valid_targets_mean": 4316.7,
"valid_targets_min": 434
},
{
"epoch": 0.9267734553775744,
"grad_norm": 0.4642198593500714,
"learning_rate": 3.9873360444219125e-05,
"loss": 0.3755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37602806091308594,
"step": 1215,
"valid_targets_mean": 4150.8,
"valid_targets_min": 1320
},
{
"epoch": 0.9305873379099924,
"grad_norm": 0.5016336613847343,
"learning_rate": 3.986905066026985e-05,
"loss": 0.3723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3845888674259186,
"step": 1220,
"valid_targets_mean": 3580.5,
"valid_targets_min": 952
},
{
"epoch": 0.9344012204424104,
"grad_norm": 0.4361161272703576,
"learning_rate": 3.9864669003976725e-05,
"loss": 0.3553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3639432489871979,
"step": 1225,
"valid_targets_mean": 5493.5,
"valid_targets_min": 1451
},
{
"epoch": 0.9382151029748284,
"grad_norm": 0.4678700452231829,
"learning_rate": 3.986021549118951e-05,
"loss": 0.3726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3865402042865753,
"step": 1230,
"valid_targets_mean": 4640.3,
"valid_targets_min": 1688
},
{
"epoch": 0.9420289855072463,
"grad_norm": 0.4582516805863473,
"learning_rate": 3.985569013801791e-05,
"loss": 0.3615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.344419002532959,
"step": 1235,
"valid_targets_mean": 4298.5,
"valid_targets_min": 1232
},
{
"epoch": 0.9458428680396643,
"grad_norm": 0.5508795531110707,
"learning_rate": 3.985109296083149e-05,
"loss": 0.3782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35687825083732605,
"step": 1240,
"valid_targets_mean": 4338.5,
"valid_targets_min": 1302
},
{
"epoch": 0.9496567505720824,
"grad_norm": 0.46268472568580293,
"learning_rate": 3.9846423976259636e-05,
"loss": 0.3554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33932235836982727,
"step": 1245,
"valid_targets_mean": 4154.8,
"valid_targets_min": 268
},
{
"epoch": 0.9534706331045004,
"grad_norm": 0.43968402739940654,
"learning_rate": 3.984168320119146e-05,
"loss": 0.3521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32227084040641785,
"step": 1250,
"valid_targets_mean": 4389.7,
"valid_targets_min": 1339
},
{
"epoch": 0.9572845156369184,
"grad_norm": 0.44988479442594437,
"learning_rate": 3.983687065277577e-05,
"loss": 0.3646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3949045240879059,
"step": 1255,
"valid_targets_mean": 4869.5,
"valid_targets_min": 504
},
{
"epoch": 0.9610983981693364,
"grad_norm": 0.40537038635756434,
"learning_rate": 3.983198634842103e-05,
"loss": 0.3501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3526088297367096,
"step": 1260,
"valid_targets_mean": 5280.7,
"valid_targets_min": 1398
},
{
"epoch": 0.9649122807017544,
"grad_norm": 0.4874777591749203,
"learning_rate": 3.98270303057952e-05,
"loss": 0.3609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3578772246837616,
"step": 1265,
"valid_targets_mean": 3603.2,
"valid_targets_min": 885
},
{
"epoch": 0.9687261632341724,
"grad_norm": 0.5168742238318518,
"learning_rate": 3.982200254282582e-05,
"loss": 0.3822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3917689621448517,
"step": 1270,
"valid_targets_mean": 4895.9,
"valid_targets_min": 1220
},
{
"epoch": 0.9725400457665904,
"grad_norm": 0.4316036947777234,
"learning_rate": 3.981690307769979e-05,
"loss": 0.3573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3554462194442749,
"step": 1275,
"valid_targets_mean": 5234.3,
"valid_targets_min": 1270
},
{
"epoch": 0.9763539282990084,
"grad_norm": 0.429176169776203,
"learning_rate": 3.981173192886344e-05,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3734845221042633,
"step": 1280,
"valid_targets_mean": 4930.2,
"valid_targets_min": 1275
},
{
"epoch": 0.9801678108314263,
"grad_norm": 0.4957017873240747,
"learning_rate": 3.9806489115022354e-05,
"loss": 0.3662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3890209496021271,
"step": 1285,
"valid_targets_mean": 4734.1,
"valid_targets_min": 949
},
{
"epoch": 0.9839816933638444,
"grad_norm": 0.5143350218465076,
"learning_rate": 3.980117465514138e-05,
"loss": 0.3723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.364015132188797,
"step": 1290,
"valid_targets_mean": 3851.5,
"valid_targets_min": 1105
},
{
"epoch": 0.9877955758962624,
"grad_norm": 0.45135446002856094,
"learning_rate": 3.979578856844452e-05,
"loss": 0.3596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34121426939964294,
"step": 1295,
"valid_targets_mean": 4531.8,
"valid_targets_min": 1130
},
{
"epoch": 0.9916094584286804,
"grad_norm": 0.45261428570516965,
"learning_rate": 3.9790330874414866e-05,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3475932776927948,
"step": 1300,
"valid_targets_mean": 4569.3,
"valid_targets_min": 1345
},
{
"epoch": 0.9954233409610984,
"grad_norm": 0.5036230227201647,
"learning_rate": 3.978480159279455e-05,
"loss": 0.3675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40386661887168884,
"step": 1305,
"valid_targets_mean": 4841.8,
"valid_targets_min": 1035
},
{
"epoch": 0.9992372234935164,
"grad_norm": 1.4960925211456237,
"learning_rate": 3.9779200743584644e-05,
"loss": 0.5992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7448456883430481,
"step": 1310,
"valid_targets_mean": 893.5,
"valid_targets_min": 437
},
{
"epoch": 1.0030511060259344,
"grad_norm": 0.4793463160181418,
"learning_rate": 3.977352834704512e-05,
"loss": 0.4091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33799681067466736,
"step": 1315,
"valid_targets_mean": 5001.8,
"valid_targets_min": 1201
},
{
"epoch": 1.0068649885583525,
"grad_norm": 0.5438675684910989,
"learning_rate": 3.976778442369472e-05,
"loss": 0.3658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3457205295562744,
"step": 1320,
"valid_targets_mean": 3972.8,
"valid_targets_min": 1183
},
{
"epoch": 1.0106788710907704,
"grad_norm": 0.5140942413587252,
"learning_rate": 3.9761968994310966e-05,
"loss": 0.3708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3165968954563141,
"step": 1325,
"valid_targets_mean": 4328.2,
"valid_targets_min": 1027
},
{
"epoch": 1.0144927536231885,
"grad_norm": 0.45617290652451703,
"learning_rate": 3.975608207993002e-05,
"loss": 0.3639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3801937401294708,
"step": 1330,
"valid_targets_mean": 3989.0,
"valid_targets_min": 1000
},
{
"epoch": 1.0183066361556063,
"grad_norm": 0.4341972844635562,
"learning_rate": 3.9750123701846615e-05,
"loss": 0.358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3951098918914795,
"step": 1335,
"valid_targets_mean": 4721.1,
"valid_targets_min": 1509
},
{
"epoch": 1.0221205186880244,
"grad_norm": 0.46730836638900286,
"learning_rate": 3.974409388161401e-05,
"loss": 0.3683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40257081389427185,
"step": 1340,
"valid_targets_mean": 4757.3,
"valid_targets_min": 579
},
{
"epoch": 1.0259344012204423,
"grad_norm": 0.5515646605187918,
"learning_rate": 3.973799264104387e-05,
"loss": 0.3523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36521920561790466,
"step": 1345,
"valid_targets_mean": 3518.1,
"valid_targets_min": 703
},
{
"epoch": 1.0297482837528604,
"grad_norm": 0.470326967727145,
"learning_rate": 3.973182000220622e-05,
"loss": 0.3873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38522180914878845,
"step": 1350,
"valid_targets_mean": 4128.1,
"valid_targets_min": 1327
},
{
"epoch": 1.0335621662852783,
"grad_norm": 0.40705686780411454,
"learning_rate": 3.972557598742938e-05,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3122781217098236,
"step": 1355,
"valid_targets_mean": 4659.9,
"valid_targets_min": 1388
},
{
"epoch": 1.0373760488176964,
"grad_norm": 0.44803605568572163,
"learning_rate": 3.9719260619299806e-05,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36841270327568054,
"step": 1360,
"valid_targets_mean": 4919.1,
"valid_targets_min": 825
},
{
"epoch": 1.0411899313501145,
"grad_norm": 0.46321347066260277,
"learning_rate": 3.9712873920662096e-05,
"loss": 0.3511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3696576654911041,
"step": 1365,
"valid_targets_mean": 4718.7,
"valid_targets_min": 1230
},
{
"epoch": 1.0450038138825324,
"grad_norm": 0.5080500551538887,
"learning_rate": 3.970641591461886e-05,
"loss": 0.3581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33408328890800476,
"step": 1370,
"valid_targets_mean": 3776.7,
"valid_targets_min": 921
},
{
"epoch": 1.0488176964149505,
"grad_norm": 0.4401310958483072,
"learning_rate": 3.9699886624530664e-05,
"loss": 0.3579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32947924733161926,
"step": 1375,
"valid_targets_mean": 5090.0,
"valid_targets_min": 947
},
{
"epoch": 1.0526315789473684,
"grad_norm": 0.45200095524939027,
"learning_rate": 3.9693286074015904e-05,
"loss": 0.345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3618582785129547,
"step": 1380,
"valid_targets_mean": 4528.5,
"valid_targets_min": 711
},
{
"epoch": 1.0564454614797865,
"grad_norm": 0.47049293711643714,
"learning_rate": 3.968661428695077e-05,
"loss": 0.3713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3690056800842285,
"step": 1385,
"valid_targets_mean": 4277.3,
"valid_targets_min": 917
},
{
"epoch": 1.0602593440122043,
"grad_norm": 0.4737449066959073,
"learning_rate": 3.967987128746913e-05,
"loss": 0.3575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4023532569408417,
"step": 1390,
"valid_targets_mean": 4950.3,
"valid_targets_min": 1222
},
{
"epoch": 1.0640732265446224,
"grad_norm": 0.49450505312447235,
"learning_rate": 3.967305709996243e-05,
"loss": 0.3555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3727036416530609,
"step": 1395,
"valid_targets_mean": 4383.7,
"valid_targets_min": 531
},
{
"epoch": 1.0678871090770405,
"grad_norm": 0.5028180651368124,
"learning_rate": 3.966617174907965e-05,
"loss": 0.3592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37223827838897705,
"step": 1400,
"valid_targets_mean": 3776.0,
"valid_targets_min": 1426
},
{
"epoch": 1.0717009916094584,
"grad_norm": 0.43787090970748827,
"learning_rate": 3.965921525972717e-05,
"loss": 0.354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3454868495464325,
"step": 1405,
"valid_targets_mean": 5180.0,
"valid_targets_min": 1199
},
{
"epoch": 1.0755148741418765,
"grad_norm": 0.4319389732299042,
"learning_rate": 3.965218765706872e-05,
"loss": 0.356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3510608971118927,
"step": 1410,
"valid_targets_mean": 5052.3,
"valid_targets_min": 1547
},
{
"epoch": 1.0793287566742944,
"grad_norm": 0.48206632149639017,
"learning_rate": 3.964508896652525e-05,
"loss": 0.3467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36549773812294006,
"step": 1415,
"valid_targets_mean": 4058.3,
"valid_targets_min": 1098
},
{
"epoch": 1.0831426392067125,
"grad_norm": 0.4967406185966264,
"learning_rate": 3.9637919213774874e-05,
"loss": 0.3693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4231281280517578,
"step": 1420,
"valid_targets_mean": 4121.5,
"valid_targets_min": 1049
},
{
"epoch": 1.0869565217391304,
"grad_norm": 0.4878295316799637,
"learning_rate": 3.9630678424752735e-05,
"loss": 0.3531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37907230854034424,
"step": 1425,
"valid_targets_mean": 4030.7,
"valid_targets_min": 1407
},
{
"epoch": 1.0907704042715485,
"grad_norm": 0.5465674854063036,
"learning_rate": 3.962336662565095e-05,
"loss": 0.3653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4150486886501312,
"step": 1430,
"valid_targets_mean": 4677.6,
"valid_targets_min": 1302
},
{
"epoch": 1.0945842868039664,
"grad_norm": 0.49768719325902566,
"learning_rate": 3.96159838429185e-05,
"loss": 0.3615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3882100582122803,
"step": 1435,
"valid_targets_mean": 3504.0,
"valid_targets_min": 1117
},
{
"epoch": 1.0983981693363845,
"grad_norm": 0.4537747668323573,
"learning_rate": 3.9608530103261144e-05,
"loss": 0.3349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3308643400669098,
"step": 1440,
"valid_targets_mean": 4242.5,
"valid_targets_min": 1444
},
{
"epoch": 1.1022120518688023,
"grad_norm": 0.5164541178291466,
"learning_rate": 3.960100543364129e-05,
"loss": 0.3534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3670574128627777,
"step": 1445,
"valid_targets_mean": 3909.9,
"valid_targets_min": 725
},
{
"epoch": 1.1060259344012204,
"grad_norm": 0.491392353620686,
"learning_rate": 3.959340986127795e-05,
"loss": 0.3538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36460360884666443,
"step": 1450,
"valid_targets_mean": 3961.4,
"valid_targets_min": 1059
},
{
"epoch": 1.1098398169336385,
"grad_norm": 0.4847216514006396,
"learning_rate": 3.958574341364659e-05,
"loss": 0.3736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35377323627471924,
"step": 1455,
"valid_targets_mean": 4016.4,
"valid_targets_min": 981
},
{
"epoch": 1.1136536994660564,
"grad_norm": 0.4406608047156622,
"learning_rate": 3.957800611847907e-05,
"loss": 0.3373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3387221097946167,
"step": 1460,
"valid_targets_mean": 4490.6,
"valid_targets_min": 1025
},
{
"epoch": 1.1174675819984745,
"grad_norm": 0.5213473880559113,
"learning_rate": 3.95701980037635e-05,
"loss": 0.351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3637104332447052,
"step": 1465,
"valid_targets_mean": 3972.2,
"valid_targets_min": 419
},
{
"epoch": 1.1212814645308924,
"grad_norm": 0.4556617981657067,
"learning_rate": 3.956231909774421e-05,
"loss": 0.358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3975560665130615,
"step": 1470,
"valid_targets_mean": 4520.6,
"valid_targets_min": 972
},
{
"epoch": 1.1250953470633105,
"grad_norm": 0.6469133777791192,
"learning_rate": 3.955436942892156e-05,
"loss": 0.572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4174586534500122,
"step": 1475,
"valid_targets_mean": 2480.5,
"valid_targets_min": 586
},
{
"epoch": 1.1289092295957284,
"grad_norm": 0.5042352279798316,
"learning_rate": 3.9546349026051886e-05,
"loss": 0.3572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3503652513027191,
"step": 1480,
"valid_targets_mean": 4591.0,
"valid_targets_min": 1422
},
{
"epoch": 1.1327231121281465,
"grad_norm": 0.4639759371870002,
"learning_rate": 3.953825791814743e-05,
"loss": 0.3625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3499886989593506,
"step": 1485,
"valid_targets_mean": 4414.1,
"valid_targets_min": 802
},
{
"epoch": 1.1365369946605646,
"grad_norm": 0.49820487639813743,
"learning_rate": 3.9530096134476155e-05,
"loss": 0.3769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4116916358470917,
"step": 1490,
"valid_targets_mean": 4242.8,
"valid_targets_min": 1180
},
{
"epoch": 1.1403508771929824,
"grad_norm": 0.4163673959740096,
"learning_rate": 3.9521863704561684e-05,
"loss": 0.338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3374262750148773,
"step": 1495,
"valid_targets_mean": 4853.1,
"valid_targets_min": 1206
},
{
"epoch": 1.1441647597254005,
"grad_norm": 0.4770566684957642,
"learning_rate": 3.9513560658183216e-05,
"loss": 0.3619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3136308491230011,
"step": 1500,
"valid_targets_mean": 3941.9,
"valid_targets_min": 771
},
{
"epoch": 1.1479786422578184,
"grad_norm": 0.5794955093822997,
"learning_rate": 3.9505187025375346e-05,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.342024564743042,
"step": 1505,
"valid_targets_mean": 4745.8,
"valid_targets_min": 1322
},
{
"epoch": 1.1517925247902365,
"grad_norm": 0.5261646401760552,
"learning_rate": 3.949674283642805e-05,
"loss": 0.3701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3519936501979828,
"step": 1510,
"valid_targets_mean": 2909.0,
"valid_targets_min": 957
},
{
"epoch": 1.1556064073226544,
"grad_norm": 0.43176897604586745,
"learning_rate": 3.94882281218865e-05,
"loss": 0.3629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3459691107273102,
"step": 1515,
"valid_targets_mean": 4479.5,
"valid_targets_min": 1510
},
{
"epoch": 1.1594202898550725,
"grad_norm": 0.45134668768661756,
"learning_rate": 3.9479642912550975e-05,
"loss": 0.3289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3575803339481354,
"step": 1520,
"valid_targets_mean": 4954.8,
"valid_targets_min": 1624
},
{
"epoch": 1.1632341723874904,
"grad_norm": 0.47627942604124146,
"learning_rate": 3.947098723947677e-05,
"loss": 0.338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3104186952114105,
"step": 1525,
"valid_targets_mean": 4333.7,
"valid_targets_min": 861
},
{
"epoch": 1.1670480549199085,
"grad_norm": 0.4585945533797258,
"learning_rate": 3.9462261133974066e-05,
"loss": 0.3532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37167060375213623,
"step": 1530,
"valid_targets_mean": 4614.9,
"valid_targets_min": 1063
},
{
"epoch": 1.1708619374523264,
"grad_norm": 0.4392639573208927,
"learning_rate": 3.945346462760781e-05,
"loss": 0.3546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3076896667480469,
"step": 1535,
"valid_targets_mean": 3828.2,
"valid_targets_min": 1029
},
{
"epoch": 1.1746758199847445,
"grad_norm": 0.4428160285363157,
"learning_rate": 3.944459775219762e-05,
"loss": 0.3416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3300919532775879,
"step": 1540,
"valid_targets_mean": 4357.5,
"valid_targets_min": 1403
},
{
"epoch": 1.1784897025171626,
"grad_norm": 0.42255626498476845,
"learning_rate": 3.943566053981766e-05,
"loss": 0.359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35865628719329834,
"step": 1545,
"valid_targets_mean": 4991.6,
"valid_targets_min": 1196
},
{
"epoch": 1.1823035850495804,
"grad_norm": 0.4397533808750128,
"learning_rate": 3.942665302279651e-05,
"loss": 0.3396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3123394846916199,
"step": 1550,
"valid_targets_mean": 4861.5,
"valid_targets_min": 1284
},
{
"epoch": 1.1861174675819985,
"grad_norm": 0.4386214823026046,
"learning_rate": 3.941757523371708e-05,
"loss": 0.3447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35547080636024475,
"step": 1555,
"valid_targets_mean": 5120.7,
"valid_targets_min": 1014
},
{
"epoch": 1.1899313501144164,
"grad_norm": 0.40482676317507504,
"learning_rate": 3.940842720541647e-05,
"loss": 0.3493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3050001859664917,
"step": 1560,
"valid_targets_mean": 5011.2,
"valid_targets_min": 447
},
{
"epoch": 1.1937452326468345,
"grad_norm": 0.43799832347524176,
"learning_rate": 3.9399208970985854e-05,
"loss": 0.3589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3959282338619232,
"step": 1565,
"valid_targets_mean": 5331.9,
"valid_targets_min": 780
},
{
"epoch": 1.1975591151792524,
"grad_norm": 0.4087742386160605,
"learning_rate": 3.938992056377036e-05,
"loss": 0.3388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34477710723876953,
"step": 1570,
"valid_targets_mean": 4720.4,
"valid_targets_min": 1129
},
{
"epoch": 1.2013729977116705,
"grad_norm": 0.47016536084109734,
"learning_rate": 3.938056201736896e-05,
"loss": 0.3376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3292127549648285,
"step": 1575,
"valid_targets_mean": 4415.0,
"valid_targets_min": 1096
},
{
"epoch": 1.2051868802440886,
"grad_norm": 0.4443565972939098,
"learning_rate": 3.9371133365634345e-05,
"loss": 0.3615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3656719923019409,
"step": 1580,
"valid_targets_mean": 5174.2,
"valid_targets_min": 728
},
{
"epoch": 1.2090007627765065,
"grad_norm": 0.44083945242650846,
"learning_rate": 3.936163464267277e-05,
"loss": 0.3594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34252461791038513,
"step": 1585,
"valid_targets_mean": 4408.7,
"valid_targets_min": 1133
},
{
"epoch": 1.2128146453089246,
"grad_norm": 0.5140162937717304,
"learning_rate": 3.935206588284399e-05,
"loss": 0.3582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32750964164733887,
"step": 1590,
"valid_targets_mean": 3657.9,
"valid_targets_min": 437
},
{
"epoch": 1.2166285278413425,
"grad_norm": 0.5023178879375496,
"learning_rate": 3.93424271207611e-05,
"loss": 0.3721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.412407249212265,
"step": 1595,
"valid_targets_mean": 3667.6,
"valid_targets_min": 924
},
{
"epoch": 1.2204424103737606,
"grad_norm": 0.4393578258491763,
"learning_rate": 3.93327183912904e-05,
"loss": 0.3467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2946208715438843,
"step": 1600,
"valid_targets_mean": 3893.6,
"valid_targets_min": 259
},
{
"epoch": 1.2242562929061784,
"grad_norm": 0.458741999764665,
"learning_rate": 3.932293972955128e-05,
"loss": 0.3536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37496721744537354,
"step": 1605,
"valid_targets_mean": 5185.8,
"valid_targets_min": 877
},
{
"epoch": 1.2280701754385965,
"grad_norm": 0.418527038541922,
"learning_rate": 3.931309117091612e-05,
"loss": 0.3844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36490917205810547,
"step": 1610,
"valid_targets_mean": 4935.5,
"valid_targets_min": 1328
},
{
"epoch": 1.2318840579710144,
"grad_norm": 0.46733135474543663,
"learning_rate": 3.9303172751010125e-05,
"loss": 0.343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.320946604013443,
"step": 1615,
"valid_targets_mean": 4701.2,
"valid_targets_min": 1053
},
{
"epoch": 1.2356979405034325,
"grad_norm": 0.45296201790488233,
"learning_rate": 3.929318450571119e-05,
"loss": 0.3694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3832404911518097,
"step": 1620,
"valid_targets_mean": 4571.2,
"valid_targets_min": 1179
},
{
"epoch": 1.2395118230358504,
"grad_norm": 0.4198962646812139,
"learning_rate": 3.928312647114983e-05,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38623082637786865,
"step": 1625,
"valid_targets_mean": 5367.0,
"valid_targets_min": 1576
},
{
"epoch": 1.2433257055682685,
"grad_norm": 0.7679243209756554,
"learning_rate": 3.9272998683708986e-05,
"loss": 0.3563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3500606119632721,
"step": 1630,
"valid_targets_mean": 4513.1,
"valid_targets_min": 1114
},
{
"epoch": 1.2471395881006866,
"grad_norm": 0.5228173268588197,
"learning_rate": 3.9262801180023906e-05,
"loss": 0.3569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37457337975502014,
"step": 1635,
"valid_targets_mean": 3563.4,
"valid_targets_min": 1235
},
{
"epoch": 1.2509534706331045,
"grad_norm": 1.33047435809795,
"learning_rate": 3.925253399698203e-05,
"loss": 0.6628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6713621616363525,
"step": 1640,
"valid_targets_mean": 904.5,
"valid_targets_min": 535
},
{
"epoch": 1.2547673531655226,
"grad_norm": 0.49263940048523913,
"learning_rate": 3.924219717172287e-05,
"loss": 0.3783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37166628241539,
"step": 1645,
"valid_targets_mean": 5407.8,
"valid_targets_min": 967
},
{
"epoch": 1.2585812356979404,
"grad_norm": 0.47593125119627555,
"learning_rate": 3.923179074163783e-05,
"loss": 0.3523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33608245849609375,
"step": 1650,
"valid_targets_mean": 4629.0,
"valid_targets_min": 942
},
{
"epoch": 1.2623951182303585,
"grad_norm": 0.5443093285946626,
"learning_rate": 3.92213147443701e-05,
"loss": 0.3583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38303980231285095,
"step": 1655,
"valid_targets_mean": 3721.8,
"valid_targets_min": 1239
},
{
"epoch": 1.2662090007627764,
"grad_norm": 0.4699119549454572,
"learning_rate": 3.9210769217814525e-05,
"loss": 0.3571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32681989669799805,
"step": 1660,
"valid_targets_mean": 3964.7,
"valid_targets_min": 1498
},
{
"epoch": 1.2700228832951945,
"grad_norm": 0.5367643229818877,
"learning_rate": 3.920015420011745e-05,
"loss": 0.3697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3740926682949066,
"step": 1665,
"valid_targets_mean": 3617.1,
"valid_targets_min": 1119
},
{
"epoch": 1.2738367658276126,
"grad_norm": 0.4364917789756035,
"learning_rate": 3.91894697296766e-05,
"loss": 0.3499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3437977731227875,
"step": 1670,
"valid_targets_mean": 5194.5,
"valid_targets_min": 506
},
{
"epoch": 1.2776506483600305,
"grad_norm": 0.4648383478668736,
"learning_rate": 3.9178715845140905e-05,
"loss": 0.3337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3175346553325653,
"step": 1675,
"valid_targets_mean": 3968.0,
"valid_targets_min": 1443
},
{
"epoch": 1.2814645308924484,
"grad_norm": 0.4580772095759182,
"learning_rate": 3.9167892585410416e-05,
"loss": 0.3559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3617471158504486,
"step": 1680,
"valid_targets_mean": 4163.8,
"valid_targets_min": 1016
},
{
"epoch": 1.2852784134248665,
"grad_norm": 0.420705068027108,
"learning_rate": 3.9156999989636136e-05,
"loss": 0.3435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3555961847305298,
"step": 1685,
"valid_targets_mean": 4794.0,
"valid_targets_min": 1423
},
{
"epoch": 1.2890922959572846,
"grad_norm": 0.4445370315663098,
"learning_rate": 3.914603809721985e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3598546087741852,
"step": 1690,
"valid_targets_mean": 4818.8,
"valid_targets_min": 1828
},
{
"epoch": 1.2929061784897025,
"grad_norm": 0.46001476720088763,
"learning_rate": 3.9135006947814046e-05,
"loss": 0.3352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33533012866973877,
"step": 1695,
"valid_targets_mean": 3634.5,
"valid_targets_min": 1127
},
{
"epoch": 1.2967200610221206,
"grad_norm": 0.4605186587488973,
"learning_rate": 3.912390658132169e-05,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31520143151283264,
"step": 1700,
"valid_targets_mean": 3687.9,
"valid_targets_min": 436
},
{
"epoch": 1.3005339435545384,
"grad_norm": 0.5048292450977424,
"learning_rate": 3.9112737037896176e-05,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3381100594997406,
"step": 1705,
"valid_targets_mean": 3859.2,
"valid_targets_min": 1237
},
{
"epoch": 1.3043478260869565,
"grad_norm": 0.4470374365915368,
"learning_rate": 3.910149835794109e-05,
"loss": 0.3468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3507278859615326,
"step": 1710,
"valid_targets_mean": 4842.5,
"valid_targets_min": 1110
},
{
"epoch": 1.3081617086193744,
"grad_norm": 0.4725388725302536,
"learning_rate": 3.909019058211014e-05,
"loss": 0.3591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3592679500579834,
"step": 1715,
"valid_targets_mean": 3800.2,
"valid_targets_min": 637
},
{
"epoch": 1.3119755911517925,
"grad_norm": 0.5010840472800245,
"learning_rate": 3.907881375130695e-05,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36546194553375244,
"step": 1720,
"valid_targets_mean": 4041.3,
"valid_targets_min": 931
},
{
"epoch": 1.3157894736842106,
"grad_norm": 0.47479083395813454,
"learning_rate": 3.906736790668495e-05,
"loss": 0.3372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34209373593330383,
"step": 1725,
"valid_targets_mean": 3945.6,
"valid_targets_min": 872
},
{
"epoch": 1.3196033562166285,
"grad_norm": 0.5639829384354162,
"learning_rate": 3.90558530896472e-05,
"loss": 0.3469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3194632828235626,
"step": 1730,
"valid_targets_mean": 2889.1,
"valid_targets_min": 734
},
{
"epoch": 1.3234172387490466,
"grad_norm": 0.5903513954151072,
"learning_rate": 3.904426934184628e-05,
"loss": 0.3427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3566388189792633,
"step": 1735,
"valid_targets_mean": 4816.4,
"valid_targets_min": 1084
},
{
"epoch": 1.3272311212814645,
"grad_norm": 0.4503945917654869,
"learning_rate": 3.903261670518408e-05,
"loss": 0.3405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3107925355434418,
"step": 1740,
"valid_targets_mean": 3587.4,
"valid_targets_min": 1143
},
{
"epoch": 1.3310450038138826,
"grad_norm": 0.43065662871245963,
"learning_rate": 3.90208952218117e-05,
"loss": 0.3517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3414647877216339,
"step": 1745,
"valid_targets_mean": 4295.7,
"valid_targets_min": 1226
},
{
"epoch": 1.3348588863463005,
"grad_norm": 0.5237745139377946,
"learning_rate": 3.900910493412929e-05,
"loss": 0.3319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.316201388835907,
"step": 1750,
"valid_targets_mean": 3234.5,
"valid_targets_min": 279
},
{
"epoch": 1.3386727688787186,
"grad_norm": 0.47093036937632515,
"learning_rate": 3.899724588478586e-05,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39046618342399597,
"step": 1755,
"valid_targets_mean": 4542.8,
"valid_targets_min": 1109
},
{
"epoch": 1.3424866514111367,
"grad_norm": 0.43907041625968424,
"learning_rate": 3.898531811667918e-05,
"loss": 0.3545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38379302620887756,
"step": 1760,
"valid_targets_mean": 4806.4,
"valid_targets_min": 837
},
{
"epoch": 1.3463005339435545,
"grad_norm": 0.4489257140697931,
"learning_rate": 3.8973321672955567e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32360532879829407,
"step": 1765,
"valid_targets_mean": 4818.2,
"valid_targets_min": 1553
},
{
"epoch": 1.3501144164759724,
"grad_norm": 0.42475418240586327,
"learning_rate": 3.896125659700978e-05,
"loss": 0.3484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37827810645103455,
"step": 1770,
"valid_targets_mean": 4799.2,
"valid_targets_min": 720
},
{
"epoch": 1.3539282990083905,
"grad_norm": 0.39913389476248523,
"learning_rate": 3.894912293248483e-05,
"loss": 0.3418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32091864943504333,
"step": 1775,
"valid_targets_mean": 5017.3,
"valid_targets_min": 1309
},
{
"epoch": 1.3577421815408086,
"grad_norm": 0.4408505758029835,
"learning_rate": 3.893692072327185e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32390084862709045,
"step": 1780,
"valid_targets_mean": 4561.3,
"valid_targets_min": 1150
},
{
"epoch": 1.3615560640732265,
"grad_norm": 0.4294374639015818,
"learning_rate": 3.89246500135099e-05,
"loss": 0.35,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3629796504974365,
"step": 1785,
"valid_targets_mean": 4894.0,
"valid_targets_min": 773
},
{
"epoch": 1.3653699466056446,
"grad_norm": 0.4357821842127782,
"learning_rate": 3.8912310847585834e-05,
"loss": 0.3225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3116796314716339,
"step": 1790,
"valid_targets_mean": 4334.6,
"valid_targets_min": 1197
},
{
"epoch": 1.3691838291380625,
"grad_norm": 0.4082665954305704,
"learning_rate": 3.889990327013412e-05,
"loss": 0.3372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2875381410121918,
"step": 1795,
"valid_targets_mean": 4551.9,
"valid_targets_min": 900
},
{
"epoch": 1.3729977116704806,
"grad_norm": 0.4160729509219186,
"learning_rate": 3.8887427326036734e-05,
"loss": 0.3289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.331479549407959,
"step": 1800,
"valid_targets_mean": 5323.6,
"valid_targets_min": 942
},
{
"epoch": 1.3768115942028984,
"grad_norm": 0.5546043445045815,
"learning_rate": 3.887488306042291e-05,
"loss": 0.5092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37859976291656494,
"step": 1805,
"valid_targets_mean": 3949.1,
"valid_targets_min": 1206
},
{
"epoch": 1.3806254767353165,
"grad_norm": 0.5594497655541855,
"learning_rate": 3.886227051866903e-05,
"loss": 0.3617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3657640516757965,
"step": 1810,
"valid_targets_mean": 3915.1,
"valid_targets_min": 977
},
{
"epoch": 1.3844393592677346,
"grad_norm": 0.45346305540885756,
"learning_rate": 3.884958974639847e-05,
"loss": 0.3484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33822956681251526,
"step": 1815,
"valid_targets_mean": 5037.4,
"valid_targets_min": 268
},
{
"epoch": 1.3882532418001525,
"grad_norm": 0.4420952120039936,
"learning_rate": 3.8836840789481405e-05,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3412349224090576,
"step": 1820,
"valid_targets_mean": 4367.5,
"valid_targets_min": 1371
},
{
"epoch": 1.3920671243325706,
"grad_norm": 0.44468726024354555,
"learning_rate": 3.882402369403464e-05,
"loss": 0.3417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37281331419944763,
"step": 1825,
"valid_targets_mean": 4771.2,
"valid_targets_min": 1556
},
{
"epoch": 1.3958810068649885,
"grad_norm": 0.42890277592066967,
"learning_rate": 3.881113850642149e-05,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33766472339630127,
"step": 1830,
"valid_targets_mean": 4216.5,
"valid_targets_min": 1181
},
{
"epoch": 1.3996948893974066,
"grad_norm": 0.4632207322961925,
"learning_rate": 3.879818527325156e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3948814868927002,
"step": 1835,
"valid_targets_mean": 5034.9,
"valid_targets_min": 1488
},
{
"epoch": 1.4035087719298245,
"grad_norm": 0.4379505402410926,
"learning_rate": 3.878516404138058e-05,
"loss": 0.3339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3263804018497467,
"step": 1840,
"valid_targets_mean": 4342.8,
"valid_targets_min": 1501
},
{
"epoch": 1.4073226544622426,
"grad_norm": 0.48956467051524727,
"learning_rate": 3.877207485791028e-05,
"loss": 0.3333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3223048746585846,
"step": 1845,
"valid_targets_mean": 3916.5,
"valid_targets_min": 1133
},
{
"epoch": 1.4111365369946607,
"grad_norm": 0.5061823012263362,
"learning_rate": 3.875891777018818e-05,
"loss": 0.3479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3740794360637665,
"step": 1850,
"valid_targets_mean": 4306.0,
"valid_targets_min": 1533
},
{
"epoch": 1.4149504195270786,
"grad_norm": 0.44374624013085096,
"learning_rate": 3.874569282580744e-05,
"loss": 0.3391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3182269334793091,
"step": 1855,
"valid_targets_mean": 4329.9,
"valid_targets_min": 1148
},
{
"epoch": 1.4187643020594964,
"grad_norm": 0.5282857561363704,
"learning_rate": 3.8732400072606663e-05,
"loss": 0.3278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34093889594078064,
"step": 1860,
"valid_targets_mean": 5093.1,
"valid_targets_min": 360
},
{
"epoch": 1.4225781845919145,
"grad_norm": 0.45036028219991575,
"learning_rate": 3.8719039558669735e-05,
"loss": 0.3609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37583938241004944,
"step": 1865,
"valid_targets_mean": 5373.0,
"valid_targets_min": 338
},
{
"epoch": 1.4263920671243326,
"grad_norm": 0.4815351622606479,
"learning_rate": 3.870561133232567e-05,
"loss": 0.3257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3166085183620453,
"step": 1870,
"valid_targets_mean": 3829.9,
"valid_targets_min": 1259
},
{
"epoch": 1.4302059496567505,
"grad_norm": 0.48428256336366055,
"learning_rate": 3.8692115442148416e-05,
"loss": 0.3388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3754858672618866,
"step": 1875,
"valid_targets_mean": 4023.9,
"valid_targets_min": 1054
},
{
"epoch": 1.4340198321891686,
"grad_norm": 0.47277520631718617,
"learning_rate": 3.8678551936956654e-05,
"loss": 0.3387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33969607949256897,
"step": 1880,
"valid_targets_mean": 4289.2,
"valid_targets_min": 426
},
{
"epoch": 1.4378337147215865,
"grad_norm": 0.43917915151002945,
"learning_rate": 3.866492086581369e-05,
"loss": 0.3198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32609280943870544,
"step": 1885,
"valid_targets_mean": 4327.0,
"valid_targets_min": 1432
},
{
"epoch": 1.4416475972540046,
"grad_norm": 0.4306387032402162,
"learning_rate": 3.865122227802721e-05,
"loss": 0.3224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2789159119129181,
"step": 1890,
"valid_targets_mean": 3979.3,
"valid_targets_min": 1352
},
{
"epoch": 1.4454614797864225,
"grad_norm": 0.4720251886440316,
"learning_rate": 3.863745622314913e-05,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3516583740711212,
"step": 1895,
"valid_targets_mean": 3531.6,
"valid_targets_min": 1374
},
{
"epoch": 1.4492753623188406,
"grad_norm": 0.46609842409964225,
"learning_rate": 3.862362275097543e-05,
"loss": 0.3288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3093758821487427,
"step": 1900,
"valid_targets_mean": 4145.7,
"valid_targets_min": 894
},
{
"epoch": 1.4530892448512587,
"grad_norm": 0.5123115804522839,
"learning_rate": 3.8609721911545926e-05,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33074355125427246,
"step": 1905,
"valid_targets_mean": 3831.0,
"valid_targets_min": 970
},
{
"epoch": 1.4569031273836766,
"grad_norm": 0.4406404957264489,
"learning_rate": 3.8595753755144156e-05,
"loss": 0.3292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32660233974456787,
"step": 1910,
"valid_targets_mean": 4124.6,
"valid_targets_min": 392
},
{
"epoch": 1.4607170099160947,
"grad_norm": 0.48541201400683953,
"learning_rate": 3.858171833229716e-05,
"loss": 0.3374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3298225700855255,
"step": 1915,
"valid_targets_mean": 4515.6,
"valid_targets_min": 1454
},
{
"epoch": 1.4645308924485125,
"grad_norm": 0.4416063227875788,
"learning_rate": 3.856761569377528e-05,
"loss": 0.3542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3587282598018646,
"step": 1920,
"valid_targets_mean": 5149.5,
"valid_targets_min": 1237
},
{
"epoch": 1.4683447749809306,
"grad_norm": 0.4250346119336662,
"learning_rate": 3.8553445890592015e-05,
"loss": 0.3612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39043954014778137,
"step": 1925,
"valid_targets_mean": 5316.2,
"valid_targets_min": 2132
},
{
"epoch": 1.4721586575133485,
"grad_norm": 0.4501574857612335,
"learning_rate": 3.85392089740038e-05,
"loss": 0.3397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33985814452171326,
"step": 1930,
"valid_targets_mean": 4548.2,
"valid_targets_min": 1677
},
{
"epoch": 1.4759725400457666,
"grad_norm": 0.4378789749328793,
"learning_rate": 3.852490499550988e-05,
"loss": 0.3418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32744383811950684,
"step": 1935,
"valid_targets_mean": 4950.3,
"valid_targets_min": 917
},
{
"epoch": 1.4797864225781847,
"grad_norm": 0.5076618596575551,
"learning_rate": 3.851053400685203e-05,
"loss": 0.3577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3824631869792938,
"step": 1940,
"valid_targets_mean": 4252.6,
"valid_targets_min": 1206
},
{
"epoch": 1.4836003051106026,
"grad_norm": 0.48737116555851495,
"learning_rate": 3.849609606001446e-05,
"loss": 0.3391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.319928914308548,
"step": 1945,
"valid_targets_mean": 3840.0,
"valid_targets_min": 828
},
{
"epoch": 1.4874141876430205,
"grad_norm": 0.4236043917290313,
"learning_rate": 3.848159120722357e-05,
"loss": 0.3268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3326864540576935,
"step": 1950,
"valid_targets_mean": 4537.5,
"valid_targets_min": 1112
},
{
"epoch": 1.4912280701754386,
"grad_norm": 0.4598342140034555,
"learning_rate": 3.846701950094779e-05,
"loss": 0.3451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3411165177822113,
"step": 1955,
"valid_targets_mean": 5026.8,
"valid_targets_min": 1170
},
{
"epoch": 1.4950419527078567,
"grad_norm": 0.41914135871574276,
"learning_rate": 3.845238099389736e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33780476450920105,
"step": 1960,
"valid_targets_mean": 5021.2,
"valid_targets_min": 952
},
{
"epoch": 1.4988558352402745,
"grad_norm": 1.3459003283983855,
"learning_rate": 3.843767573902418e-05,
"loss": 0.5818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6157845854759216,
"step": 1965,
"valid_targets_mean": 790.2,
"valid_targets_min": 583
},
{
"epoch": 1.5026697177726926,
"grad_norm": 0.4617732864123322,
"learning_rate": 3.842290378952159e-05,
"loss": 0.3401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34063920378685,
"step": 1970,
"valid_targets_mean": 4803.4,
"valid_targets_min": 839
},
{
"epoch": 1.5064836003051107,
"grad_norm": 0.531676865851445,
"learning_rate": 3.840806519882418e-05,
"loss": 0.3303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2992500364780426,
"step": 1975,
"valid_targets_mean": 3430.1,
"valid_targets_min": 613
},
{
"epoch": 1.5102974828375286,
"grad_norm": 0.5226518835402676,
"learning_rate": 3.83931600206076e-05,
"loss": 0.3564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3798552453517914,
"step": 1980,
"valid_targets_mean": 3952.5,
"valid_targets_min": 1128
},
{
"epoch": 1.5141113653699465,
"grad_norm": 0.396591484196759,
"learning_rate": 3.837818830878838e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35394302010536194,
"step": 1985,
"valid_targets_mean": 6165.4,
"valid_targets_min": 1886
},
{
"epoch": 1.5179252479023646,
"grad_norm": 0.452362199986279,
"learning_rate": 3.836315011752371e-05,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33218100666999817,
"step": 1990,
"valid_targets_mean": 5245.8,
"valid_targets_min": 1233
},
{
"epoch": 1.5217391304347827,
"grad_norm": 0.45166171439918135,
"learning_rate": 3.834804550121126e-05,
"loss": 0.3467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3478414714336395,
"step": 1995,
"valid_targets_mean": 4610.8,
"valid_targets_min": 1676
},
{
"epoch": 1.5255530129672006,
"grad_norm": 0.4356146082165587,
"learning_rate": 3.8332874514488967e-05,
"loss": 0.3413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3374311029911041,
"step": 2000,
"valid_targets_mean": 4473.1,
"valid_targets_min": 1297
},
{
"epoch": 1.5293668954996185,
"grad_norm": 0.44888934608269865,
"learning_rate": 3.831763721223488e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3361920416355133,
"step": 2005,
"valid_targets_mean": 4083.8,
"valid_targets_min": 1411
},
{
"epoch": 1.5331807780320366,
"grad_norm": 0.4579221905167076,
"learning_rate": 3.8302333649566905e-05,
"loss": 0.3441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3255065679550171,
"step": 2010,
"valid_targets_mean": 4096.5,
"valid_targets_min": 1368
},
{
"epoch": 1.5369946605644547,
"grad_norm": 0.4458324785747194,
"learning_rate": 3.828696388184265e-05,
"loss": 0.3252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33304184675216675,
"step": 2015,
"valid_targets_mean": 4516.2,
"valid_targets_min": 1309
},
{
"epoch": 1.5408085430968725,
"grad_norm": 0.4536346386160971,
"learning_rate": 3.8271527964659174e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32771816849708557,
"step": 2020,
"valid_targets_mean": 4904.3,
"valid_targets_min": 1127
},
{
"epoch": 1.5446224256292906,
"grad_norm": 0.4831566461665685,
"learning_rate": 3.8256025953852865e-05,
"loss": 0.3323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3292129933834076,
"step": 2025,
"valid_targets_mean": 4137.0,
"valid_targets_min": 806
},
{
"epoch": 1.5484363081617087,
"grad_norm": 0.47635974507726736,
"learning_rate": 3.824045790549915e-05,
"loss": 0.366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.352607399225235,
"step": 2030,
"valid_targets_mean": 4103.1,
"valid_targets_min": 818
},
{
"epoch": 1.5522501906941266,
"grad_norm": 0.4525772248307072,
"learning_rate": 3.8224823875912356e-05,
"loss": 0.3393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34870848059654236,
"step": 2035,
"valid_targets_mean": 5950.1,
"valid_targets_min": 1457
},
{
"epoch": 1.5560640732265445,
"grad_norm": 0.413493930225271,
"learning_rate": 3.820912392164548e-05,
"loss": 0.3322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3418256342411041,
"step": 2040,
"valid_targets_mean": 4733.5,
"valid_targets_min": 1069
},
{
"epoch": 1.5598779557589626,
"grad_norm": 0.46894070613005195,
"learning_rate": 3.819335809949e-05,
"loss": 0.3456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3676106631755829,
"step": 2045,
"valid_targets_mean": 4399.0,
"valid_targets_min": 946
},
{
"epoch": 1.5636918382913807,
"grad_norm": 0.4766741967603851,
"learning_rate": 3.817752646647563e-05,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30944350361824036,
"step": 2050,
"valid_targets_mean": 4400.2,
"valid_targets_min": 1848
},
{
"epoch": 1.5675057208237986,
"grad_norm": 0.41158705325321077,
"learning_rate": 3.816162907987016e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3295304477214813,
"step": 2055,
"valid_targets_mean": 5128.7,
"valid_targets_min": 1255
},
{
"epoch": 1.5713196033562167,
"grad_norm": 0.4284366443368262,
"learning_rate": 3.8145665997179235e-05,
"loss": 0.3517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3419044017791748,
"step": 2060,
"valid_targets_mean": 5012.1,
"valid_targets_min": 613
},
{
"epoch": 1.5751334858886348,
"grad_norm": 0.5240013370140941,
"learning_rate": 3.8129637276146134e-05,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3423541784286499,
"step": 2065,
"valid_targets_mean": 3542.5,
"valid_targets_min": 1116
},
{
"epoch": 1.5789473684210527,
"grad_norm": 0.4615080821026482,
"learning_rate": 3.8113542974751565e-05,
"loss": 0.3488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39265763759613037,
"step": 2070,
"valid_targets_mean": 4613.8,
"valid_targets_min": 1458
},
{
"epoch": 1.5827612509534705,
"grad_norm": 0.45660629131457464,
"learning_rate": 3.809738315121347e-05,
"loss": 0.3399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35427650809288025,
"step": 2075,
"valid_targets_mean": 4815.3,
"valid_targets_min": 496
},
{
"epoch": 1.5865751334858886,
"grad_norm": 0.4657806705792738,
"learning_rate": 3.8081157863986806e-05,
"loss": 0.3512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2970011532306671,
"step": 2080,
"valid_targets_mean": 4139.2,
"valid_targets_min": 337
},
{
"epoch": 1.5903890160183067,
"grad_norm": 0.4365020499059465,
"learning_rate": 3.806486717176332e-05,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30660709738731384,
"step": 2085,
"valid_targets_mean": 3980.7,
"valid_targets_min": 873
},
{
"epoch": 1.5942028985507246,
"grad_norm": 0.506656163039576,
"learning_rate": 3.8048511133471356e-05,
"loss": 0.3353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4007803499698639,
"step": 2090,
"valid_targets_mean": 4447.3,
"valid_targets_min": 959
},
{
"epoch": 1.5980167810831425,
"grad_norm": 0.4751817793688682,
"learning_rate": 3.8032089808275635e-05,
"loss": 0.3237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35235536098480225,
"step": 2095,
"valid_targets_mean": 4583.0,
"valid_targets_min": 1399
},
{
"epoch": 1.6018306636155606,
"grad_norm": 0.4508540415280725,
"learning_rate": 3.801560325557703e-05,
"loss": 0.3422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3305545449256897,
"step": 2100,
"valid_targets_mean": 4408.1,
"valid_targets_min": 737
},
{
"epoch": 1.6056445461479787,
"grad_norm": 0.4299155016841301,
"learning_rate": 3.799905153501238e-05,
"loss": 0.3151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.327955424785614,
"step": 2105,
"valid_targets_mean": 4504.2,
"valid_targets_min": 1246
},
{
"epoch": 1.6094584286803966,
"grad_norm": 0.4783710619498741,
"learning_rate": 3.798243470645425e-05,
"loss": 0.3273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33135396242141724,
"step": 2110,
"valid_targets_mean": 3603.8,
"valid_targets_min": 983
},
{
"epoch": 1.6132723112128147,
"grad_norm": 0.37927325672645257,
"learning_rate": 3.7965752830010706e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32099059224128723,
"step": 2115,
"valid_targets_mean": 5331.1,
"valid_targets_min": 1746
},
{
"epoch": 1.6170861937452328,
"grad_norm": 0.40761644497991223,
"learning_rate": 3.794900596602513e-05,
"loss": 0.3283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29120543599128723,
"step": 2120,
"valid_targets_mean": 4769.4,
"valid_targets_min": 468
},
{
"epoch": 1.6209000762776506,
"grad_norm": 0.45214903550117586,
"learning_rate": 3.793219417507597e-05,
"loss": 0.3451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3507181704044342,
"step": 2125,
"valid_targets_mean": 4438.9,
"valid_targets_min": 956
},
{
"epoch": 1.6247139588100685,
"grad_norm": 1.411976482155846,
"learning_rate": 3.7915317517976544e-05,
"loss": 0.5326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6349965333938599,
"step": 2130,
"valid_targets_mean": 843.3,
"valid_targets_min": 648
},
{
"epoch": 1.6285278413424866,
"grad_norm": 0.4296479124857058,
"learning_rate": 3.7898376055774806e-05,
"loss": 0.4073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31556937098503113,
"step": 2135,
"valid_targets_mean": 4938.8,
"valid_targets_min": 541
},
{
"epoch": 1.6323417238749047,
"grad_norm": 0.462970001455935,
"learning_rate": 3.788136984975313e-05,
"loss": 0.3294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3477567136287689,
"step": 2140,
"valid_targets_mean": 4699.2,
"valid_targets_min": 1459
},
{
"epoch": 1.6361556064073226,
"grad_norm": 0.48316565101860154,
"learning_rate": 3.7864298961428085e-05,
"loss": 0.3339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32468631863594055,
"step": 2145,
"valid_targets_mean": 4554.4,
"valid_targets_min": 1345
},
{
"epoch": 1.6399694889397407,
"grad_norm": 0.41679333340014413,
"learning_rate": 3.784716345255022e-05,
"loss": 0.3285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.336759090423584,
"step": 2150,
"valid_targets_mean": 5775.1,
"valid_targets_min": 1627
},
{
"epoch": 1.6437833714721588,
"grad_norm": 0.3953743824423388,
"learning_rate": 3.782996338510384e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29986482858657837,
"step": 2155,
"valid_targets_mean": 5298.2,
"valid_targets_min": 965
},
{
"epoch": 1.6475972540045767,
"grad_norm": 0.4736632378563593,
"learning_rate": 3.781269882130677e-05,
"loss": 0.3497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35674309730529785,
"step": 2160,
"valid_targets_mean": 4210.8,
"valid_targets_min": 1120
},
{
"epoch": 1.6514111365369946,
"grad_norm": 0.4496270825352227,
"learning_rate": 3.779536982361013e-05,
"loss": 0.3509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.352872759103775,
"step": 2165,
"valid_targets_mean": 4362.2,
"valid_targets_min": 526
},
{
"epoch": 1.6552250190694127,
"grad_norm": 0.46157964831828,
"learning_rate": 3.777797645469814e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.372890830039978,
"step": 2170,
"valid_targets_mean": 4475.5,
"valid_targets_min": 1178
},
{
"epoch": 1.6590389016018308,
"grad_norm": 0.4952894396006391,
"learning_rate": 3.776051877748785e-05,
"loss": 0.3195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3195929527282715,
"step": 2175,
"valid_targets_mean": 3625.1,
"valid_targets_min": 452
},
{
"epoch": 1.6628527841342486,
"grad_norm": 0.4345556379723053,
"learning_rate": 3.774299685512894e-05,
"loss": 0.3213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3343975245952606,
"step": 2180,
"valid_targets_mean": 4466.4,
"valid_targets_min": 1113
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.42305269061244527,
"learning_rate": 3.772541075100349e-05,
"loss": 0.3361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36715126037597656,
"step": 2185,
"valid_targets_mean": 4677.8,
"valid_targets_min": 711
},
{
"epoch": 1.6704805491990846,
"grad_norm": 0.42759806624710345,
"learning_rate": 3.770776052872573e-05,
"loss": 0.3256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3473476469516754,
"step": 2190,
"valid_targets_mean": 5200.2,
"valid_targets_min": 1401
},
{
"epoch": 1.6742944317315027,
"grad_norm": 0.7660926707707012,
"learning_rate": 3.7690046252141826e-05,
"loss": 0.3409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32988297939300537,
"step": 2195,
"valid_targets_mean": 4637.0,
"valid_targets_min": 1224
},
{
"epoch": 1.6781083142639206,
"grad_norm": 0.5055398969545535,
"learning_rate": 3.767226798532967e-05,
"loss": 0.3139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30404260754585266,
"step": 2200,
"valid_targets_mean": 4207.0,
"valid_targets_min": 709
},
{
"epoch": 1.6819221967963387,
"grad_norm": 0.4291374647287734,
"learning_rate": 3.765442579259861e-05,
"loss": 0.3222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28727686405181885,
"step": 2205,
"valid_targets_mean": 4335.9,
"valid_targets_min": 510
},
{
"epoch": 1.6857360793287568,
"grad_norm": 0.46292742476924886,
"learning_rate": 3.763651973848923e-05,
"loss": 0.3143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31533995270729065,
"step": 2210,
"valid_targets_mean": 3919.2,
"valid_targets_min": 1000
},
{
"epoch": 1.6895499618611747,
"grad_norm": 0.47316186208418975,
"learning_rate": 3.761854988777312e-05,
"loss": 0.3263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3339639902114868,
"step": 2215,
"valid_targets_mean": 4245.3,
"valid_targets_min": 1029
},
{
"epoch": 1.6933638443935926,
"grad_norm": 0.40865623345995916,
"learning_rate": 3.760051630545264e-05,
"loss": 0.3308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192019462585449,
"step": 2220,
"valid_targets_mean": 5094.4,
"valid_targets_min": 1841
},
{
"epoch": 1.6971777269260107,
"grad_norm": 0.45723802330184893,
"learning_rate": 3.758241905676071e-05,
"loss": 0.3268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33453646302223206,
"step": 2225,
"valid_targets_mean": 3709.2,
"valid_targets_min": 423
},
{
"epoch": 1.7009916094584288,
"grad_norm": 0.4526269440545832,
"learning_rate": 3.7564258207160515e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3633545935153961,
"step": 2230,
"valid_targets_mean": 4224.0,
"valid_targets_min": 1141
},
{
"epoch": 1.7048054919908466,
"grad_norm": 0.6122509098643096,
"learning_rate": 3.754603382234533e-05,
"loss": 0.3222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.307157039642334,
"step": 2235,
"valid_targets_mean": 3546.7,
"valid_targets_min": 892
},
{
"epoch": 1.7086193745232647,
"grad_norm": 0.4624666321272271,
"learning_rate": 3.752774596823825e-05,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3046889007091522,
"step": 2240,
"valid_targets_mean": 4233.8,
"valid_targets_min": 291
},
{
"epoch": 1.7124332570556828,
"grad_norm": 0.44703143367338366,
"learning_rate": 3.750939471099194e-05,
"loss": 0.3263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33055710792541504,
"step": 2245,
"valid_targets_mean": 4348.4,
"valid_targets_min": 1155
},
{
"epoch": 1.7162471395881007,
"grad_norm": 0.4865255846967005,
"learning_rate": 3.7490980116988446e-05,
"loss": 0.3257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35459789633750916,
"step": 2250,
"valid_targets_mean": 3480.5,
"valid_targets_min": 454
},
{
"epoch": 1.7200610221205186,
"grad_norm": 0.41553778964381777,
"learning_rate": 3.747250225283889e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33044007420539856,
"step": 2255,
"valid_targets_mean": 5068.1,
"valid_targets_min": 1043
},
{
"epoch": 1.7238749046529367,
"grad_norm": 0.47247749062464844,
"learning_rate": 3.7453961185383275e-05,
"loss": 0.3174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3662593364715576,
"step": 2260,
"valid_targets_mean": 4381.7,
"valid_targets_min": 984
},
{
"epoch": 1.7276887871853548,
"grad_norm": 0.4342970807308119,
"learning_rate": 3.743535698169024e-05,
"loss": 0.3237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3155607581138611,
"step": 2265,
"valid_targets_mean": 4959.0,
"valid_targets_min": 688
},
{
"epoch": 1.7315026697177727,
"grad_norm": 0.4835822940202946,
"learning_rate": 3.741668970905678e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3475397527217865,
"step": 2270,
"valid_targets_mean": 4047.2,
"valid_targets_min": 924
},
{
"epoch": 1.7353165522501905,
"grad_norm": 0.4143882838773366,
"learning_rate": 3.739795943500807e-05,
"loss": 0.3338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3046738803386688,
"step": 2275,
"valid_targets_mean": 4457.8,
"valid_targets_min": 1307
},
{
"epoch": 1.7391304347826086,
"grad_norm": 0.47715588140017007,
"learning_rate": 3.7379166227297134e-05,
"loss": 0.3337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36505427956581116,
"step": 2280,
"valid_targets_mean": 4550.1,
"valid_targets_min": 1258
},
{
"epoch": 1.7429443173150267,
"grad_norm": 0.47746507980133923,
"learning_rate": 3.7360310153904676e-05,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3104887306690216,
"step": 2285,
"valid_targets_mean": 4238.9,
"valid_targets_min": 1358
},
{
"epoch": 1.7467581998474446,
"grad_norm": 0.4366855078559095,
"learning_rate": 3.73413912830388e-05,
"loss": 0.3338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3296510577201843,
"step": 2290,
"valid_targets_mean": 4354.8,
"valid_targets_min": 1124
},
{
"epoch": 1.7505720823798627,
"grad_norm": 1.5920308734552946,
"learning_rate": 3.7322409683134754e-05,
"loss": 0.4648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6426330208778381,
"step": 2295,
"valid_targets_mean": 798.7,
"valid_targets_min": 662
},
{
"epoch": 1.7543859649122808,
"grad_norm": 0.4334877061500335,
"learning_rate": 3.730336542285471e-05,
"loss": 0.3945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.326994389295578,
"step": 2300,
"valid_targets_mean": 4903.4,
"valid_targets_min": 1525
},
{
"epoch": 1.7581998474446987,
"grad_norm": 0.49634867580345554,
"learning_rate": 3.7284258571087485e-05,
"loss": 0.3233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30348965525627136,
"step": 2305,
"valid_targets_mean": 3528.3,
"valid_targets_min": 1120
},
{
"epoch": 1.7620137299771166,
"grad_norm": 0.49812732348341127,
"learning_rate": 3.726508919694834e-05,
"loss": 0.3288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.314765602350235,
"step": 2310,
"valid_targets_mean": 3092.0,
"valid_targets_min": 1160
},
{
"epoch": 1.7658276125095347,
"grad_norm": 0.5244174030752281,
"learning_rate": 3.724585736977867e-05,
"loss": 0.3391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3550000488758087,
"step": 2315,
"valid_targets_mean": 4437.4,
"valid_targets_min": 1185
},
{
"epoch": 1.7696414950419528,
"grad_norm": 0.4093823038328312,
"learning_rate": 3.722656315914579e-05,
"loss": 0.3414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3699674606323242,
"step": 2320,
"valid_targets_mean": 5781.1,
"valid_targets_min": 1382
},
{
"epoch": 1.7734553775743707,
"grad_norm": 0.4082424315818475,
"learning_rate": 3.7207206634842664e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2742947041988373,
"step": 2325,
"valid_targets_mean": 5018.0,
"valid_targets_min": 1360
},
{
"epoch": 1.7772692601067888,
"grad_norm": 0.4250104636252426,
"learning_rate": 3.7187787866887685e-05,
"loss": 0.3316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3289525508880615,
"step": 2330,
"valid_targets_mean": 4318.1,
"valid_targets_min": 1018
},
{
"epoch": 1.7810831426392069,
"grad_norm": 0.45335953265388873,
"learning_rate": 3.7168306925524385e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3171369135379791,
"step": 2335,
"valid_targets_mean": 4464.4,
"valid_targets_min": 671
},
{
"epoch": 1.7848970251716247,
"grad_norm": 0.43854487824763294,
"learning_rate": 3.71487638812212e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31873399019241333,
"step": 2340,
"valid_targets_mean": 4436.9,
"valid_targets_min": 1155
},
{
"epoch": 1.7887109077040426,
"grad_norm": 0.412063477973113,
"learning_rate": 3.712915880467121e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3235747218132019,
"step": 2345,
"valid_targets_mean": 5156.3,
"valid_targets_min": 1447
},
{
"epoch": 1.7925247902364607,
"grad_norm": 0.4389626587211984,
"learning_rate": 3.7109491766791886e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3347223997116089,
"step": 2350,
"valid_targets_mean": 4220.4,
"valid_targets_min": 834
},
{
"epoch": 1.7963386727688788,
"grad_norm": 0.43041614373722964,
"learning_rate": 3.708976283872483e-05,
"loss": 0.331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.302156001329422,
"step": 2355,
"valid_targets_mean": 4227.2,
"valid_targets_min": 867
},
{
"epoch": 1.8001525553012967,
"grad_norm": 0.4264746043330624,
"learning_rate": 3.706997209183552e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3170943558216095,
"step": 2360,
"valid_targets_mean": 4943.4,
"valid_targets_min": 871
},
{
"epoch": 1.8039664378337146,
"grad_norm": 0.4435488437349904,
"learning_rate": 3.705011959771306e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3009158670902252,
"step": 2365,
"valid_targets_mean": 4024.0,
"valid_targets_min": 1455
},
{
"epoch": 1.8077803203661327,
"grad_norm": 0.40895192075459724,
"learning_rate": 3.7030205428169887e-05,
"loss": 0.3415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3293893039226532,
"step": 2370,
"valid_targets_mean": 5075.9,
"valid_targets_min": 1286
},
{
"epoch": 1.8115942028985508,
"grad_norm": 0.41660708290497744,
"learning_rate": 3.701022965524156e-05,
"loss": 0.335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31239140033721924,
"step": 2375,
"valid_targets_mean": 4275.4,
"valid_targets_min": 1051
},
{
"epoch": 1.8154080854309687,
"grad_norm": 0.4453736647599715,
"learning_rate": 3.6990192351186475e-05,
"loss": 0.3182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3469693958759308,
"step": 2380,
"valid_targets_mean": 4513.8,
"valid_targets_min": 1277
},
{
"epoch": 1.8192219679633868,
"grad_norm": 0.46119885811553796,
"learning_rate": 3.6970093588485594e-05,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27816879749298096,
"step": 2385,
"valid_targets_mean": 3789.4,
"valid_targets_min": 1465
},
{
"epoch": 1.8230358504958049,
"grad_norm": 0.4291482862044303,
"learning_rate": 3.694993343984221e-05,
"loss": 0.314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3009355068206787,
"step": 2390,
"valid_targets_mean": 4632.9,
"valid_targets_min": 1292
},
{
"epoch": 1.8268497330282227,
"grad_norm": 0.5478615406961075,
"learning_rate": 3.692971197818164e-05,
"loss": 0.3365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3457231819629669,
"step": 2395,
"valid_targets_mean": 3948.9,
"valid_targets_min": 993
},
{
"epoch": 1.8306636155606406,
"grad_norm": 0.479894949737753,
"learning_rate": 3.6909429276651005e-05,
"loss": 0.3414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3317417800426483,
"step": 2400,
"valid_targets_mean": 4785.0,
"valid_targets_min": 986
},
{
"epoch": 1.8344774980930587,
"grad_norm": 0.4285777476400902,
"learning_rate": 3.688908540861896e-05,
"loss": 0.331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31536248326301575,
"step": 2405,
"valid_targets_mean": 4312.8,
"valid_targets_min": 1685
},
{
"epoch": 1.8382913806254768,
"grad_norm": 0.4375917603899561,
"learning_rate": 3.68686804476754e-05,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3218797743320465,
"step": 2410,
"valid_targets_mean": 4685.2,
"valid_targets_min": 1185
},
{
"epoch": 1.8421052631578947,
"grad_norm": 0.5273066457088933,
"learning_rate": 3.684821446763121e-05,
"loss": 0.3396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39353689551353455,
"step": 2415,
"valid_targets_mean": 4030.5,
"valid_targets_min": 1191
},
{
"epoch": 1.8459191456903128,
"grad_norm": 0.4440672321044689,
"learning_rate": 3.682768754251803e-05,
"loss": 0.3164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2948742210865021,
"step": 2420,
"valid_targets_mean": 4679.3,
"valid_targets_min": 1334
},
{
"epoch": 1.849733028222731,
"grad_norm": 0.4782127118356837,
"learning_rate": 3.680709974658792e-05,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35153254866600037,
"step": 2425,
"valid_targets_mean": 4014.6,
"valid_targets_min": 991
},
{
"epoch": 1.8535469107551488,
"grad_norm": 0.44745555716907837,
"learning_rate": 3.678645115431313e-05,
"loss": 0.3384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34888049960136414,
"step": 2430,
"valid_targets_mean": 5085.6,
"valid_targets_min": 1168
},
{
"epoch": 1.8573607932875666,
"grad_norm": 0.4665568435081105,
"learning_rate": 3.6765741840385865e-05,
"loss": 0.3277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34056076407432556,
"step": 2435,
"valid_targets_mean": 4100.6,
"valid_targets_min": 927
},
{
"epoch": 1.8611746758199847,
"grad_norm": 0.41128691480695334,
"learning_rate": 3.674497187971794e-05,
"loss": 0.3415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34780147671699524,
"step": 2440,
"valid_targets_mean": 5574.4,
"valid_targets_min": 713
},
{
"epoch": 1.8649885583524028,
"grad_norm": 0.4746141475032033,
"learning_rate": 3.6724141347440564e-05,
"loss": 0.3164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898326814174652,
"step": 2445,
"valid_targets_mean": 3968.1,
"valid_targets_min": 523
},
{
"epoch": 1.8688024408848207,
"grad_norm": 0.5670987020490634,
"learning_rate": 3.6703250318904044e-05,
"loss": 0.3345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3524753749370575,
"step": 2450,
"valid_targets_mean": 3708.4,
"valid_targets_min": 704
},
{
"epoch": 1.8726163234172386,
"grad_norm": 0.4486880722932088,
"learning_rate": 3.6682298869677534e-05,
"loss": 0.3372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32234349846839905,
"step": 2455,
"valid_targets_mean": 4402.6,
"valid_targets_min": 1164
},
{
"epoch": 1.8764302059496567,
"grad_norm": 1.3784929400623749,
"learning_rate": 3.666128707554874e-05,
"loss": 0.4908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6172937750816345,
"step": 2460,
"valid_targets_mean": 874.1,
"valid_targets_min": 602
},
{
"epoch": 1.8802440884820748,
"grad_norm": 0.4825156091808825,
"learning_rate": 3.664021501252365e-05,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34351110458374023,
"step": 2465,
"valid_targets_mean": 3739.3,
"valid_targets_min": 886
},
{
"epoch": 1.8840579710144927,
"grad_norm": 0.43231635726104817,
"learning_rate": 3.661908275682626e-05,
"loss": 0.3175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3112673759460449,
"step": 2470,
"valid_targets_mean": 4797.2,
"valid_targets_min": 858
},
{
"epoch": 1.8878718535469108,
"grad_norm": 0.4389419887999067,
"learning_rate": 3.659789038489832e-05,
"loss": 0.3301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3528638780117035,
"step": 2475,
"valid_targets_mean": 4661.2,
"valid_targets_min": 844
},
{
"epoch": 1.8916857360793289,
"grad_norm": 0.4063170356085659,
"learning_rate": 3.657663797339902e-05,
"loss": 0.3279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3472946584224701,
"step": 2480,
"valid_targets_mean": 5096.3,
"valid_targets_min": 1602
},
{
"epoch": 1.8954996186117468,
"grad_norm": 0.4473609779628171,
"learning_rate": 3.655532559920474e-05,
"loss": 0.3346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35601258277893066,
"step": 2485,
"valid_targets_mean": 4471.4,
"valid_targets_min": 473
},
{
"epoch": 1.8993135011441646,
"grad_norm": 0.510089392544064,
"learning_rate": 3.653395333940875e-05,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3393765985965729,
"step": 2490,
"valid_targets_mean": 3695.0,
"valid_targets_min": 1341
},
{
"epoch": 1.9031273836765827,
"grad_norm": 0.4163060605293795,
"learning_rate": 3.651252127132097e-05,
"loss": 0.3283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34253692626953125,
"step": 2495,
"valid_targets_mean": 5056.7,
"valid_targets_min": 1742
},
{
"epoch": 1.9069412662090008,
"grad_norm": 0.45275357622864393,
"learning_rate": 3.6491029472467625e-05,
"loss": 0.3338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3306049704551697,
"step": 2500,
"valid_targets_mean": 4381.1,
"valid_targets_min": 1526
},
{
"epoch": 1.9107551487414187,
"grad_norm": 0.4289727513447695,
"learning_rate": 3.6469478020591046e-05,
"loss": 0.3297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31081557273864746,
"step": 2505,
"valid_targets_mean": 4142.5,
"valid_targets_min": 380
},
{
"epoch": 1.9145690312738368,
"grad_norm": 0.45198414914401847,
"learning_rate": 3.644786699364933e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3111429512500763,
"step": 2510,
"valid_targets_mean": 4001.7,
"valid_targets_min": 1419
},
{
"epoch": 1.918382913806255,
"grad_norm": 0.41966906491588385,
"learning_rate": 3.6426196469816077e-05,
"loss": 0.3287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29943111538887024,
"step": 2515,
"valid_targets_mean": 4615.5,
"valid_targets_min": 1134
},
{
"epoch": 1.9221967963386728,
"grad_norm": 0.3990234568258909,
"learning_rate": 3.6404466527480085e-05,
"loss": 0.3262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3199032247066498,
"step": 2520,
"valid_targets_mean": 5416.6,
"valid_targets_min": 1373
},
{
"epoch": 1.9260106788710907,
"grad_norm": 0.4100126062269341,
"learning_rate": 3.638267724524512e-05,
"loss": 0.3352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3309996426105499,
"step": 2525,
"valid_targets_mean": 4957.5,
"valid_targets_min": 1516
},
{
"epoch": 1.9298245614035088,
"grad_norm": 0.48930595113950065,
"learning_rate": 3.636082870192957e-05,
"loss": 0.3307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3737516403198242,
"step": 2530,
"valid_targets_mean": 4311.6,
"valid_targets_min": 1513
},
{
"epoch": 1.9336384439359269,
"grad_norm": 0.396990511331678,
"learning_rate": 3.6338920976566206e-05,
"loss": 0.3226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.316019207239151,
"step": 2535,
"valid_targets_mean": 4857.2,
"valid_targets_min": 447
},
{
"epoch": 1.9374523264683448,
"grad_norm": 0.42707664137047063,
"learning_rate": 3.631695414840188e-05,
"loss": 0.3285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2827240526676178,
"step": 2540,
"valid_targets_mean": 4249.3,
"valid_targets_min": 1203
},
{
"epoch": 1.9412662090007626,
"grad_norm": 0.39704121969088363,
"learning_rate": 3.629492829689722e-05,
"loss": 0.3314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3076905310153961,
"step": 2545,
"valid_targets_mean": 5482.1,
"valid_targets_min": 1125
},
{
"epoch": 1.9450800915331807,
"grad_norm": 0.489030926911963,
"learning_rate": 3.627284350172637e-05,
"loss": 0.3348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3305893838405609,
"step": 2550,
"valid_targets_mean": 4072.5,
"valid_targets_min": 1354
},
{
"epoch": 1.9488939740655988,
"grad_norm": 0.4784627205409548,
"learning_rate": 3.625069984277669e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30123528838157654,
"step": 2555,
"valid_targets_mean": 3369.6,
"valid_targets_min": 827
},
{
"epoch": 1.9527078565980167,
"grad_norm": 0.5780502983031945,
"learning_rate": 3.622849740014846e-05,
"loss": 0.3164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2978937327861786,
"step": 2560,
"valid_targets_mean": 3833.6,
"valid_targets_min": 883
},
{
"epoch": 1.9565217391304348,
"grad_norm": 0.4596843365698298,
"learning_rate": 3.620623625415462e-05,
"loss": 0.314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30321425199508667,
"step": 2565,
"valid_targets_mean": 4876.5,
"valid_targets_min": 1284
},
{
"epoch": 1.960335621662853,
"grad_norm": 0.49794938194155713,
"learning_rate": 3.618391648532043e-05,
"loss": 0.321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3527390658855438,
"step": 2570,
"valid_targets_mean": 4544.0,
"valid_targets_min": 1082
},
{
"epoch": 1.9641495041952708,
"grad_norm": 0.4306105153001951,
"learning_rate": 3.616153817438323e-05,
"loss": 0.3217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2867111265659332,
"step": 2575,
"valid_targets_mean": 4612.7,
"valid_targets_min": 1333
},
{
"epoch": 1.9679633867276887,
"grad_norm": 0.5634464378301066,
"learning_rate": 3.613910140229212e-05,
"loss": 0.3341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3393392860889435,
"step": 2580,
"valid_targets_mean": 3495.5,
"valid_targets_min": 620
},
{
"epoch": 1.9717772692601068,
"grad_norm": 0.42643538618721466,
"learning_rate": 3.6116606250207646e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.314686119556427,
"step": 2585,
"valid_targets_mean": 4382.7,
"valid_targets_min": 505
},
{
"epoch": 1.9755911517925249,
"grad_norm": 0.461418186680906,
"learning_rate": 3.609405279950157e-05,
"loss": 0.3238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3472661077976227,
"step": 2590,
"valid_targets_mean": 3919.9,
"valid_targets_min": 1075
},
{
"epoch": 1.9794050343249427,
"grad_norm": 0.46477198331279196,
"learning_rate": 3.607144113175652e-05,
"loss": 0.3255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31344321370124817,
"step": 2595,
"valid_targets_mean": 3753.2,
"valid_targets_min": 753
},
{
"epoch": 1.9832189168573608,
"grad_norm": 0.4705572499094467,
"learning_rate": 3.6048771328765695e-05,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3468952476978302,
"step": 2600,
"valid_targets_mean": 3563.1,
"valid_targets_min": 521
},
{
"epoch": 1.987032799389779,
"grad_norm": 0.4894559516834718,
"learning_rate": 3.602604347253262e-05,
"loss": 0.3281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3458186089992523,
"step": 2605,
"valid_targets_mean": 4363.7,
"valid_targets_min": 447
},
{
"epoch": 1.9908466819221968,
"grad_norm": 0.4430488468498321,
"learning_rate": 3.600325764527079e-05,
"loss": 0.3227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3441220819950104,
"step": 2610,
"valid_targets_mean": 4790.8,
"valid_targets_min": 915
},
{
"epoch": 1.9946605644546147,
"grad_norm": 0.48404364026741203,
"learning_rate": 3.598041392940342e-05,
"loss": 0.3197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2899083197116852,
"step": 2615,
"valid_targets_mean": 3817.0,
"valid_targets_min": 1202
},
{
"epoch": 1.9984744469870328,
"grad_norm": 1.695860308561902,
"learning_rate": 3.5957512407563105e-05,
"loss": 0.4769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6421945095062256,
"step": 2620,
"valid_targets_mean": 780.0,
"valid_targets_min": 493
},
{
"epoch": 2.002288329519451,
"grad_norm": 0.4518557790697791,
"learning_rate": 3.593455316259155e-05,
"loss": 0.4355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28681135177612305,
"step": 2625,
"valid_targets_mean": 4816.6,
"valid_targets_min": 1551
},
{
"epoch": 2.006102212051869,
"grad_norm": 0.44782126292756547,
"learning_rate": 3.591153627753927e-05,
"loss": 0.3292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3092162013053894,
"step": 2630,
"valid_targets_mean": 4868.9,
"valid_targets_min": 1506
},
{
"epoch": 2.0099160945842867,
"grad_norm": 0.527863530413975,
"learning_rate": 3.588846183566527e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3203107416629791,
"step": 2635,
"valid_targets_mean": 3651.8,
"valid_targets_min": 728
},
{
"epoch": 2.013729977116705,
"grad_norm": 0.4487355300143573,
"learning_rate": 3.586532992043677e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3486725986003876,
"step": 2640,
"valid_targets_mean": 4654.1,
"valid_targets_min": 1003
},
{
"epoch": 2.017543859649123,
"grad_norm": 0.4149528992346252,
"learning_rate": 3.584214061552886e-05,
"loss": 0.3187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30172497034072876,
"step": 2645,
"valid_targets_mean": 4589.0,
"valid_targets_min": 364
},
{
"epoch": 2.0213577421815407,
"grad_norm": 0.4380270269367264,
"learning_rate": 3.581889400482425e-05,
"loss": 0.3305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3232972025871277,
"step": 2650,
"valid_targets_mean": 4193.9,
"valid_targets_min": 1205
},
{
"epoch": 2.0251716247139586,
"grad_norm": 0.44838457623258393,
"learning_rate": 3.5795590172412946e-05,
"loss": 0.3239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3213779926300049,
"step": 2655,
"valid_targets_mean": 5098.0,
"valid_targets_min": 1071
},
{
"epoch": 2.028985507246377,
"grad_norm": 0.45016704498329,
"learning_rate": 3.5772229202591926e-05,
"loss": 0.3448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3524353504180908,
"step": 2660,
"valid_targets_mean": 4527.9,
"valid_targets_min": 1649
},
{
"epoch": 2.032799389778795,
"grad_norm": 0.4465006685050878,
"learning_rate": 3.574881117986486e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3029600977897644,
"step": 2665,
"valid_targets_mean": 3735.4,
"valid_targets_min": 601
},
{
"epoch": 2.0366132723112127,
"grad_norm": 0.4422827681174769,
"learning_rate": 3.5725336188941785e-05,
"loss": 0.2975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2614348232746124,
"step": 2670,
"valid_targets_mean": 4119.3,
"valid_targets_min": 668
},
{
"epoch": 2.040427154843631,
"grad_norm": 0.4482051429709076,
"learning_rate": 3.570180431473883e-05,
"loss": 0.3153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3411577641963959,
"step": 2675,
"valid_targets_mean": 4912.2,
"valid_targets_min": 955
},
{
"epoch": 2.044241037376049,
"grad_norm": 0.4869196336236238,
"learning_rate": 3.567821564237787e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34559619426727295,
"step": 2680,
"valid_targets_mean": 3815.8,
"valid_targets_min": 1018
},
{
"epoch": 2.0480549199084668,
"grad_norm": 0.4897608405458026,
"learning_rate": 3.565457025718624e-05,
"loss": 0.321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3251894414424896,
"step": 2685,
"valid_targets_mean": 3756.0,
"valid_targets_min": 814
},
{
"epoch": 2.0518688024408847,
"grad_norm": 0.3818311129689496,
"learning_rate": 3.563086824469642e-05,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27594801783561707,
"step": 2690,
"valid_targets_mean": 5182.2,
"valid_targets_min": 1313
},
{
"epoch": 2.055682684973303,
"grad_norm": 0.40078657159991377,
"learning_rate": 3.560710969064574e-05,
"loss": 0.3339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34894654154777527,
"step": 2695,
"valid_targets_mean": 5636.0,
"valid_targets_min": 1050
},
{
"epoch": 2.059496567505721,
"grad_norm": 0.4314520672830342,
"learning_rate": 3.558329468097604e-05,
"loss": 0.3159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30594441294670105,
"step": 2700,
"valid_targets_mean": 4584.9,
"valid_targets_min": 626
},
{
"epoch": 2.0633104500381387,
"grad_norm": 0.4330320629369986,
"learning_rate": 3.555942330183341e-05,
"loss": 0.3276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33816561102867126,
"step": 2705,
"valid_targets_mean": 5605.0,
"valid_targets_min": 1122
},
{
"epoch": 2.0671243325705566,
"grad_norm": 0.432663280927747,
"learning_rate": 3.553549563956779e-05,
"loss": 0.3254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2950657904148102,
"step": 2710,
"valid_targets_mean": 4556.0,
"valid_targets_min": 764
},
{
"epoch": 2.070938215102975,
"grad_norm": 0.3980785685365819,
"learning_rate": 3.551151178073276e-05,
"loss": 0.3239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.351774126291275,
"step": 2715,
"valid_targets_mean": 5619.8,
"valid_targets_min": 535
},
{
"epoch": 2.074752097635393,
"grad_norm": 0.42705954615047537,
"learning_rate": 3.548747181208516e-05,
"loss": 0.3194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2942444086074829,
"step": 2720,
"valid_targets_mean": 4475.0,
"valid_targets_min": 337
},
{
"epoch": 2.0785659801678107,
"grad_norm": 0.4250243681722831,
"learning_rate": 3.5463375820584826e-05,
"loss": 0.3113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3257274925708771,
"step": 2725,
"valid_targets_mean": 4989.0,
"valid_targets_min": 816
},
{
"epoch": 2.082379862700229,
"grad_norm": 0.4781865116161094,
"learning_rate": 3.5439223893394185e-05,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36427298188209534,
"step": 2730,
"valid_targets_mean": 3891.9,
"valid_targets_min": 989
},
{
"epoch": 2.086193745232647,
"grad_norm": 0.432991181042828,
"learning_rate": 3.541501611787806e-05,
"loss": 0.3269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29490405321121216,
"step": 2735,
"valid_targets_mean": 4064.3,
"valid_targets_min": 1512
},
{
"epoch": 2.0900076277650648,
"grad_norm": 0.4358409077212192,
"learning_rate": 3.5390752581603256e-05,
"loss": 0.3241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3720548152923584,
"step": 2740,
"valid_targets_mean": 5014.2,
"valid_targets_min": 1590
},
{
"epoch": 2.0938215102974826,
"grad_norm": 0.4051452760209203,
"learning_rate": 3.536643337233831e-05,
"loss": 0.3314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32935160398483276,
"step": 2745,
"valid_targets_mean": 5356.0,
"valid_targets_min": 563
},
{
"epoch": 2.097635392829901,
"grad_norm": 0.4618577711694058,
"learning_rate": 3.5342058578053115e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31700313091278076,
"step": 2750,
"valid_targets_mean": 4074.1,
"valid_targets_min": 1113
},
{
"epoch": 2.101449275362319,
"grad_norm": 0.4650533706947534,
"learning_rate": 3.5317628286918654e-05,
"loss": 0.3128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3038328289985657,
"step": 2755,
"valid_targets_mean": 3777.7,
"valid_targets_min": 1051
},
{
"epoch": 2.1052631578947367,
"grad_norm": 0.3911911315347162,
"learning_rate": 3.5293142587306656e-05,
"loss": 0.3206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3163069784641266,
"step": 2760,
"valid_targets_mean": 5114.2,
"valid_targets_min": 1244
},
{
"epoch": 2.109077040427155,
"grad_norm": 0.4528620401506649,
"learning_rate": 3.526860156778927e-05,
"loss": 0.3408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3514285981655121,
"step": 2765,
"valid_targets_mean": 3839.7,
"valid_targets_min": 1011
},
{
"epoch": 2.112890922959573,
"grad_norm": 0.4177167860467384,
"learning_rate": 3.524400531713876e-05,
"loss": 0.3041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3051723837852478,
"step": 2770,
"valid_targets_mean": 5298.1,
"valid_targets_min": 1803
},
{
"epoch": 2.116704805491991,
"grad_norm": 0.4003676926723766,
"learning_rate": 3.521935392432718e-05,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31541749835014343,
"step": 2775,
"valid_targets_mean": 4743.7,
"valid_targets_min": 1137
},
{
"epoch": 2.1205186880244087,
"grad_norm": 0.4520780702808259,
"learning_rate": 3.5194647478526044e-05,
"loss": 0.3177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31706899404525757,
"step": 2780,
"valid_targets_mean": 4706.4,
"valid_targets_min": 267
},
{
"epoch": 2.124332570556827,
"grad_norm": 1.4925281950577982,
"learning_rate": 3.5169886069106015e-05,
"loss": 0.5112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.637296736240387,
"step": 2785,
"valid_targets_mean": 864.1,
"valid_targets_min": 587
},
{
"epoch": 2.128146453089245,
"grad_norm": 0.4277812995302766,
"learning_rate": 3.5145069785636576e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34565839171409607,
"step": 2790,
"valid_targets_mean": 4901.5,
"valid_targets_min": 1024
},
{
"epoch": 2.1319603356216628,
"grad_norm": 0.4339866826762552,
"learning_rate": 3.512019871788569e-05,
"loss": 0.33,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3311890661716461,
"step": 2795,
"valid_targets_mean": 4585.2,
"valid_targets_min": 803
},
{
"epoch": 2.135774218154081,
"grad_norm": 0.44356752428059937,
"learning_rate": 3.509527295581951e-05,
"loss": 0.33,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34069275856018066,
"step": 2800,
"valid_targets_mean": 5747.2,
"valid_targets_min": 1140
},
{
"epoch": 2.139588100686499,
"grad_norm": 0.48873464445289144,
"learning_rate": 3.507029258960203e-05,
"loss": 0.3185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3361491858959198,
"step": 2805,
"valid_targets_mean": 5306.7,
"valid_targets_min": 1462
},
{
"epoch": 2.143401983218917,
"grad_norm": 0.40843884861087065,
"learning_rate": 3.504525770959477e-05,
"loss": 0.3325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.345804363489151,
"step": 2810,
"valid_targets_mean": 5229.5,
"valid_targets_min": 375
},
{
"epoch": 2.1472158657513347,
"grad_norm": 0.4304445901977957,
"learning_rate": 3.502016840635642e-05,
"loss": 0.3228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32236722111701965,
"step": 2815,
"valid_targets_mean": 4655.3,
"valid_targets_min": 1315
},
{
"epoch": 2.151029748283753,
"grad_norm": 0.42379821089500375,
"learning_rate": 3.4995024770642554e-05,
"loss": 0.3353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3316449224948883,
"step": 2820,
"valid_targets_mean": 4426.3,
"valid_targets_min": 1482
},
{
"epoch": 2.154843630816171,
"grad_norm": 0.41185583474074233,
"learning_rate": 3.4969826893405294e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34358730912208557,
"step": 2825,
"valid_targets_mean": 5202.3,
"valid_targets_min": 1354
},
{
"epoch": 2.158657513348589,
"grad_norm": 0.44266026669962844,
"learning_rate": 3.4944574865792945e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30736637115478516,
"step": 2830,
"valid_targets_mean": 4420.9,
"valid_targets_min": 1073
},
{
"epoch": 2.1624713958810067,
"grad_norm": 0.4061991514677841,
"learning_rate": 3.4919268779149696e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31193986535072327,
"step": 2835,
"valid_targets_mean": 4632.8,
"valid_targets_min": 1249
},
{
"epoch": 2.166285278413425,
"grad_norm": 0.43478104011120616,
"learning_rate": 3.489390872501529e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3487791121006012,
"step": 2840,
"valid_targets_mean": 4533.8,
"valid_targets_min": 1392
},
{
"epoch": 2.170099160945843,
"grad_norm": 0.4078062523633683,
"learning_rate": 3.4868494795124705e-05,
"loss": 0.3328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3065103590488434,
"step": 2845,
"valid_targets_mean": 4814.8,
"valid_targets_min": 763
},
{
"epoch": 2.1739130434782608,
"grad_norm": 0.4289713522809232,
"learning_rate": 3.484302708140775e-05,
"loss": 0.3041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33483967185020447,
"step": 2850,
"valid_targets_mean": 4179.2,
"valid_targets_min": 1051
},
{
"epoch": 2.177726926010679,
"grad_norm": 0.472220403001625,
"learning_rate": 3.481750567598885e-05,
"loss": 0.3223,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.362771600484848,
"step": 2855,
"valid_targets_mean": 4404.5,
"valid_targets_min": 1088
},
{
"epoch": 2.181540808543097,
"grad_norm": 0.3648207114064372,
"learning_rate": 3.47919306711866e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2925264835357666,
"step": 2860,
"valid_targets_mean": 5416.4,
"valid_targets_min": 1482
},
{
"epoch": 2.185354691075515,
"grad_norm": 0.39372615878666817,
"learning_rate": 3.4766302159513514e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31346771121025085,
"step": 2865,
"valid_targets_mean": 5427.8,
"valid_targets_min": 1130
},
{
"epoch": 2.1891685736079327,
"grad_norm": 0.4126857886832629,
"learning_rate": 3.474062023367563e-05,
"loss": 0.3276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3509589433670044,
"step": 2870,
"valid_targets_mean": 5269.3,
"valid_targets_min": 991
},
{
"epoch": 2.192982456140351,
"grad_norm": 0.411651571169999,
"learning_rate": 3.471488498657222e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3311251401901245,
"step": 2875,
"valid_targets_mean": 5288.4,
"valid_targets_min": 763
},
{
"epoch": 2.196796338672769,
"grad_norm": 0.44636044736979674,
"learning_rate": 3.468909651129543e-05,
"loss": 0.3165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3214028775691986,
"step": 2880,
"valid_targets_mean": 4051.4,
"valid_targets_min": 990
},
{
"epoch": 2.200610221205187,
"grad_norm": 0.4449036968288949,
"learning_rate": 3.466325490112993e-05,
"loss": 0.3097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2663789689540863,
"step": 2885,
"valid_targets_mean": 3941.7,
"valid_targets_min": 605
},
{
"epoch": 2.2044241037376047,
"grad_norm": 0.43992016755573804,
"learning_rate": 3.463736024955263e-05,
"loss": 0.3234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3127845525741577,
"step": 2890,
"valid_targets_mean": 5903.5,
"valid_targets_min": 1002
},
{
"epoch": 2.208237986270023,
"grad_norm": 0.43453745171374947,
"learning_rate": 3.461141265023229e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29881763458251953,
"step": 2895,
"valid_targets_mean": 4015.5,
"valid_targets_min": 724
},
{
"epoch": 2.212051868802441,
"grad_norm": 0.3852285397340729,
"learning_rate": 3.4585412197029176e-05,
"loss": 0.3309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29247185587882996,
"step": 2900,
"valid_targets_mean": 4694.1,
"valid_targets_min": 1035
},
{
"epoch": 2.2158657513348587,
"grad_norm": 0.5136665672114349,
"learning_rate": 3.455935898399479e-05,
"loss": 0.3225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3353908956050873,
"step": 2905,
"valid_targets_mean": 4370.2,
"valid_targets_min": 1005
},
{
"epoch": 2.219679633867277,
"grad_norm": 0.4881189152233372,
"learning_rate": 3.453325310537142e-05,
"loss": 0.3362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3274397552013397,
"step": 2910,
"valid_targets_mean": 4228.9,
"valid_targets_min": 1214
},
{
"epoch": 2.223493516399695,
"grad_norm": 0.4195992283622164,
"learning_rate": 3.450709465559194e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32342055439949036,
"step": 2915,
"valid_targets_mean": 4261.7,
"valid_targets_min": 919
},
{
"epoch": 2.227307398932113,
"grad_norm": 0.4159790401363364,
"learning_rate": 3.4480883729279305e-05,
"loss": 0.3543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33828291296958923,
"step": 2920,
"valid_targets_mean": 4834.0,
"valid_targets_min": 1373
},
{
"epoch": 2.2311212814645307,
"grad_norm": 0.4165223915561082,
"learning_rate": 3.445462042124636e-05,
"loss": 0.3215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3129110634326935,
"step": 2925,
"valid_targets_mean": 4497.5,
"valid_targets_min": 1123
},
{
"epoch": 2.234935163996949,
"grad_norm": 0.38466587084214765,
"learning_rate": 3.442830482649539e-05,
"loss": 0.3256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3339121341705322,
"step": 2930,
"valid_targets_mean": 5770.3,
"valid_targets_min": 1754
},
{
"epoch": 2.238749046529367,
"grad_norm": 0.40262584621326525,
"learning_rate": 3.440193704021783e-05,
"loss": 0.3138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31021028757095337,
"step": 2935,
"valid_targets_mean": 5080.9,
"valid_targets_min": 1674
},
{
"epoch": 2.242562929061785,
"grad_norm": 0.41779524060918555,
"learning_rate": 3.4375517157793927e-05,
"loss": 0.3317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32838132977485657,
"step": 2940,
"valid_targets_mean": 4848.7,
"valid_targets_min": 1385
},
{
"epoch": 2.246376811594203,
"grad_norm": 0.4640321321894666,
"learning_rate": 3.434904527479235e-05,
"loss": 0.3195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3334600031375885,
"step": 2945,
"valid_targets_mean": 4124.4,
"valid_targets_min": 1203
},
{
"epoch": 2.250190694126621,
"grad_norm": 1.2455406449672553,
"learning_rate": 3.4322521486969866e-05,
"loss": 0.5444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6027448773384094,
"step": 2950,
"valid_targets_mean": 885.0,
"valid_targets_min": 551
},
{
"epoch": 2.254004576659039,
"grad_norm": 0.4533102457871256,
"learning_rate": 3.429594589027102e-05,
"loss": 0.3982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31670811772346497,
"step": 2955,
"valid_targets_mean": 5360.8,
"valid_targets_min": 1229
},
{
"epoch": 2.2578184591914567,
"grad_norm": 0.45007990340926657,
"learning_rate": 3.426931858082775e-05,
"loss": 0.3292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27866581082344055,
"step": 2960,
"valid_targets_mean": 4068.8,
"valid_targets_min": 978
},
{
"epoch": 2.261632341723875,
"grad_norm": 0.4182475658385057,
"learning_rate": 3.4242639654959055e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33048322796821594,
"step": 2965,
"valid_targets_mean": 5333.2,
"valid_targets_min": 1035
},
{
"epoch": 2.265446224256293,
"grad_norm": 0.44982078901385464,
"learning_rate": 3.4215909209170656e-05,
"loss": 0.3364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3067856431007385,
"step": 2970,
"valid_targets_mean": 4327.3,
"valid_targets_min": 1058
},
{
"epoch": 2.269260106788711,
"grad_norm": 0.4246313159105408,
"learning_rate": 3.418912734015463e-05,
"loss": 0.3272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3462902009487152,
"step": 2975,
"valid_targets_mean": 4803.1,
"valid_targets_min": 403
},
{
"epoch": 2.273073989321129,
"grad_norm": 0.4537107473424202,
"learning_rate": 3.416229414478907e-05,
"loss": 0.3241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3000136911869049,
"step": 2980,
"valid_targets_mean": 4820.1,
"valid_targets_min": 1166
},
{
"epoch": 2.276887871853547,
"grad_norm": 0.4202091063659574,
"learning_rate": 3.4135409720137725e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28874197602272034,
"step": 2985,
"valid_targets_mean": 3907.3,
"valid_targets_min": 1048
},
{
"epoch": 2.280701754385965,
"grad_norm": 0.46834762645468975,
"learning_rate": 3.4108474163449653e-05,
"loss": 0.3157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35787180066108704,
"step": 2990,
"valid_targets_mean": 3768.8,
"valid_targets_min": 969
},
{
"epoch": 2.2845156369183828,
"grad_norm": 0.44621662808084633,
"learning_rate": 3.40814875721589e-05,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3383162319660187,
"step": 2995,
"valid_targets_mean": 4347.9,
"valid_targets_min": 681
},
{
"epoch": 2.288329519450801,
"grad_norm": 0.4276744418335265,
"learning_rate": 3.405445004388408e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28751322627067566,
"step": 3000,
"valid_targets_mean": 4021.9,
"valid_targets_min": 1002
},
{
"epoch": 2.292143401983219,
"grad_norm": 0.43665377536255506,
"learning_rate": 3.402736167642809e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3026927411556244,
"step": 3005,
"valid_targets_mean": 4820.8,
"valid_targets_min": 1394
},
{
"epoch": 2.295957284515637,
"grad_norm": 0.41102468091858063,
"learning_rate": 3.400022256777772e-05,
"loss": 0.3075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29576948285102844,
"step": 3010,
"valid_targets_mean": 4581.5,
"valid_targets_min": 1097
},
{
"epoch": 2.2997711670480547,
"grad_norm": 0.38434638037208735,
"learning_rate": 3.39730328161033e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3018251061439514,
"step": 3015,
"valid_targets_mean": 4958.6,
"valid_targets_min": 1754
},
{
"epoch": 2.303585049580473,
"grad_norm": 0.4335198527505541,
"learning_rate": 3.394579251975836e-05,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2881692051887512,
"step": 3020,
"valid_targets_mean": 4141.5,
"valid_targets_min": 1515
},
{
"epoch": 2.307398932112891,
"grad_norm": 0.4124467111134283,
"learning_rate": 3.391850177727924e-05,
"loss": 0.3264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35339486598968506,
"step": 3025,
"valid_targets_mean": 5283.4,
"valid_targets_min": 1263
},
{
"epoch": 2.311212814645309,
"grad_norm": 0.4661684649657449,
"learning_rate": 3.389116068738482e-05,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31515705585479736,
"step": 3030,
"valid_targets_mean": 4185.0,
"valid_targets_min": 492
},
{
"epoch": 2.3150266971777267,
"grad_norm": 0.435483883866706,
"learning_rate": 3.3863769348976024e-05,
"loss": 0.312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3099616467952728,
"step": 3035,
"valid_targets_mean": 4285.6,
"valid_targets_min": 712
},
{
"epoch": 2.318840579710145,
"grad_norm": 0.4489741349463335,
"learning_rate": 3.38363278611356e-05,
"loss": 0.3186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31510940194129944,
"step": 3040,
"valid_targets_mean": 4578.5,
"valid_targets_min": 1220
},
{
"epoch": 2.322654462242563,
"grad_norm": 0.454132578096704,
"learning_rate": 3.3808836323127666e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31616052985191345,
"step": 3045,
"valid_targets_mean": 4476.0,
"valid_targets_min": 924
},
{
"epoch": 2.3264683447749808,
"grad_norm": 0.4706189536012141,
"learning_rate": 3.3781294834397416e-05,
"loss": 0.3202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3171687722206116,
"step": 3050,
"valid_targets_mean": 3822.8,
"valid_targets_min": 1079
},
{
"epoch": 2.330282227307399,
"grad_norm": 0.4688702774722974,
"learning_rate": 3.375370349457069e-05,
"loss": 0.3144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29751574993133545,
"step": 3055,
"valid_targets_mean": 3372.0,
"valid_targets_min": 745
},
{
"epoch": 2.334096109839817,
"grad_norm": 0.45350633325165235,
"learning_rate": 3.37260624034537e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26518234610557556,
"step": 3060,
"valid_targets_mean": 3821.1,
"valid_targets_min": 1002
},
{
"epoch": 2.337909992372235,
"grad_norm": 0.4509818679226893,
"learning_rate": 3.36983716610326e-05,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2775558531284332,
"step": 3065,
"valid_targets_mean": 3986.3,
"valid_targets_min": 1127
},
{
"epoch": 2.3417238749046527,
"grad_norm": 0.4220414814745815,
"learning_rate": 3.3670631367473136e-05,
"loss": 0.3239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31039997935295105,
"step": 3070,
"valid_targets_mean": 4780.5,
"valid_targets_min": 1411
},
{
"epoch": 2.345537757437071,
"grad_norm": 0.4625202358326965,
"learning_rate": 3.364284162312032e-05,
"loss": 0.3128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3140174150466919,
"step": 3075,
"valid_targets_mean": 3760.7,
"valid_targets_min": 1065
},
{
"epoch": 2.349351639969489,
"grad_norm": 0.4041288445251084,
"learning_rate": 3.361500252849803e-05,
"loss": 0.3071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2915945053100586,
"step": 3080,
"valid_targets_mean": 4437.5,
"valid_targets_min": 743
},
{
"epoch": 2.353165522501907,
"grad_norm": 0.42664167212219883,
"learning_rate": 3.3587114184308664e-05,
"loss": 0.3237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3082127869129181,
"step": 3085,
"valid_targets_mean": 4920.8,
"valid_targets_min": 566
},
{
"epoch": 2.356979405034325,
"grad_norm": 0.45595971770828464,
"learning_rate": 3.355917669143276e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.314989298582077,
"step": 3090,
"valid_targets_mean": 3974.5,
"valid_targets_min": 1242
},
{
"epoch": 2.360793287566743,
"grad_norm": 0.4267031520990776,
"learning_rate": 3.3531190150928655e-05,
"loss": 0.3122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31824013590812683,
"step": 3095,
"valid_targets_mean": 4419.4,
"valid_targets_min": 1017
},
{
"epoch": 2.364607170099161,
"grad_norm": 0.40719312557802045,
"learning_rate": 3.35031546640321e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29631316661834717,
"step": 3100,
"valid_targets_mean": 4890.0,
"valid_targets_min": 1432
},
{
"epoch": 2.3684210526315788,
"grad_norm": 0.4836219301990495,
"learning_rate": 3.347507033215589e-05,
"loss": 0.3117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3056109845638275,
"step": 3105,
"valid_targets_mean": 3523.5,
"valid_targets_min": 1035
},
{
"epoch": 2.372234935163997,
"grad_norm": 0.46664455271321875,
"learning_rate": 3.344693725688953e-05,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30344218015670776,
"step": 3110,
"valid_targets_mean": 4145.0,
"valid_targets_min": 1151
},
{
"epoch": 2.376048817696415,
"grad_norm": 0.4709941009473953,
"learning_rate": 3.341875553999883e-05,
"loss": 0.4522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29392245411872864,
"step": 3115,
"valid_targets_mean": 4008.7,
"valid_targets_min": 371
},
{
"epoch": 2.379862700228833,
"grad_norm": 0.4204995391050676,
"learning_rate": 3.339052528342554e-05,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34602752327919006,
"step": 3120,
"valid_targets_mean": 4779.5,
"valid_targets_min": 1024
},
{
"epoch": 2.383676582761251,
"grad_norm": 0.4404868029867653,
"learning_rate": 3.336224658928702e-05,
"loss": 0.3234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3412117063999176,
"step": 3125,
"valid_targets_mean": 4316.2,
"valid_targets_min": 1087
},
{
"epoch": 2.387490465293669,
"grad_norm": 0.48253694746867987,
"learning_rate": 3.3333919559875817e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30176326632499695,
"step": 3130,
"valid_targets_mean": 3363.5,
"valid_targets_min": 1126
},
{
"epoch": 2.391304347826087,
"grad_norm": 0.47060528945887725,
"learning_rate": 3.330554429765933e-05,
"loss": 0.3056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2910543978214264,
"step": 3135,
"valid_targets_mean": 4389.2,
"valid_targets_min": 1106
},
{
"epoch": 2.395118230358505,
"grad_norm": 0.40268416401652135,
"learning_rate": 3.3277120905279454e-05,
"loss": 0.3301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3227095603942871,
"step": 3140,
"valid_targets_mean": 5091.1,
"valid_targets_min": 379
},
{
"epoch": 2.398932112890923,
"grad_norm": 0.5366231607872158,
"learning_rate": 3.324864948555215e-05,
"loss": 0.3059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31209537386894226,
"step": 3145,
"valid_targets_mean": 3523.9,
"valid_targets_min": 497
},
{
"epoch": 2.402745995423341,
"grad_norm": 0.46305780755530407,
"learning_rate": 3.3220130141467126e-05,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2822486460208893,
"step": 3150,
"valid_targets_mean": 4739.7,
"valid_targets_min": 1556
},
{
"epoch": 2.406559877955759,
"grad_norm": 0.41772343288346137,
"learning_rate": 3.319156297618744e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29450178146362305,
"step": 3155,
"valid_targets_mean": 4559.1,
"valid_targets_min": 1074
},
{
"epoch": 2.410373760488177,
"grad_norm": 0.4009891297301182,
"learning_rate": 3.316294809304914e-05,
"loss": 0.3083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2615176737308502,
"step": 3160,
"valid_targets_mean": 4259.6,
"valid_targets_min": 320
},
{
"epoch": 2.414187643020595,
"grad_norm": 0.5372736697822601,
"learning_rate": 3.3134285595560884e-05,
"loss": 0.3216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3198303282260895,
"step": 3165,
"valid_targets_mean": 4708.5,
"valid_targets_min": 1294
},
{
"epoch": 2.418001525553013,
"grad_norm": 0.5006156073841829,
"learning_rate": 3.310557558740356e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28113606572151184,
"step": 3170,
"valid_targets_mean": 3367.2,
"valid_targets_min": 773
},
{
"epoch": 2.421815408085431,
"grad_norm": 0.5394294222955758,
"learning_rate": 3.3076818172429925e-05,
"loss": 0.324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3090674579143524,
"step": 3175,
"valid_targets_mean": 3041.1,
"valid_targets_min": 561
},
{
"epoch": 2.425629290617849,
"grad_norm": 0.3752343434469316,
"learning_rate": 3.304801345466421e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2914296090602875,
"step": 3180,
"valid_targets_mean": 5173.1,
"valid_targets_min": 1182
},
{
"epoch": 2.429443173150267,
"grad_norm": 0.36719834272513013,
"learning_rate": 3.301916153830175e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2869374454021454,
"step": 3185,
"valid_targets_mean": 5752.6,
"valid_targets_min": 1254
},
{
"epoch": 2.433257055682685,
"grad_norm": 0.46120148501188674,
"learning_rate": 3.299026252770864e-05,
"loss": 0.3163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30976438522338867,
"step": 3190,
"valid_targets_mean": 4156.0,
"valid_targets_min": 952
},
{
"epoch": 2.437070938215103,
"grad_norm": 0.4028904691522973,
"learning_rate": 3.2961316527421297e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2804625332355499,
"step": 3195,
"valid_targets_mean": 5134.5,
"valid_targets_min": 939
},
{
"epoch": 2.440884820747521,
"grad_norm": 0.42739158339434313,
"learning_rate": 3.293232364214613e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2903222441673279,
"step": 3200,
"valid_targets_mean": 4225.7,
"valid_targets_min": 1532
},
{
"epoch": 2.444698703279939,
"grad_norm": 0.4120940942202485,
"learning_rate": 3.2903283976759154e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3225897550582886,
"step": 3205,
"valid_targets_mean": 4823.2,
"valid_targets_min": 1258
},
{
"epoch": 2.448512585812357,
"grad_norm": 0.4438438890063094,
"learning_rate": 3.287419763630557e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3097473680973053,
"step": 3210,
"valid_targets_mean": 4313.7,
"valid_targets_min": 1132
},
{
"epoch": 2.4523264683447747,
"grad_norm": 0.454562761903692,
"learning_rate": 3.284506472599946e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27896568179130554,
"step": 3215,
"valid_targets_mean": 3983.9,
"valid_targets_min": 376
},
{
"epoch": 2.456140350877193,
"grad_norm": 0.41734956806317247,
"learning_rate": 3.281588535122331e-05,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3313711881637573,
"step": 3220,
"valid_targets_mean": 4768.2,
"valid_targets_min": 1079
},
{
"epoch": 2.459954233409611,
"grad_norm": 0.4050882230027488,
"learning_rate": 3.278665961752774e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3018350601196289,
"step": 3225,
"valid_targets_mean": 4809.2,
"valid_targets_min": 1149
},
{
"epoch": 2.463768115942029,
"grad_norm": 0.44512875562523363,
"learning_rate": 3.2757387630631015e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3171129822731018,
"step": 3230,
"valid_targets_mean": 4194.5,
"valid_targets_min": 1214
},
{
"epoch": 2.467581998474447,
"grad_norm": 0.4318883742701634,
"learning_rate": 3.272806949641875e-05,
"loss": 0.3282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30675944685935974,
"step": 3235,
"valid_targets_mean": 4495.5,
"valid_targets_min": 1280
},
{
"epoch": 2.471395881006865,
"grad_norm": 0.5127454111107679,
"learning_rate": 3.269870532094346e-05,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.305593341588974,
"step": 3240,
"valid_targets_mean": 4044.5,
"valid_targets_min": 852
},
{
"epoch": 2.475209763539283,
"grad_norm": 0.44932328995702725,
"learning_rate": 3.2669295210424216e-05,
"loss": 0.3151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3079918920993805,
"step": 3245,
"valid_targets_mean": 4045.1,
"valid_targets_min": 829
},
{
"epoch": 2.479023646071701,
"grad_norm": 0.4248740581634684,
"learning_rate": 3.263983927124626e-05,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3253237307071686,
"step": 3250,
"valid_targets_mean": 4557.6,
"valid_targets_min": 1362
},
{
"epoch": 2.482837528604119,
"grad_norm": 0.47524928688800416,
"learning_rate": 3.26103376099606e-05,
"loss": 0.3209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33182817697525024,
"step": 3255,
"valid_targets_mean": 4120.5,
"valid_targets_min": 288
},
{
"epoch": 2.486651411136537,
"grad_norm": 0.4013284951011599,
"learning_rate": 3.258079033328362e-05,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2935488522052765,
"step": 3260,
"valid_targets_mean": 5461.8,
"valid_targets_min": 699
},
{
"epoch": 2.490465293668955,
"grad_norm": 0.4560281553599727,
"learning_rate": 3.255119754809674e-05,
"loss": 0.3128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3281641900539398,
"step": 3265,
"valid_targets_mean": 3976.6,
"valid_targets_min": 1316
},
{
"epoch": 2.494279176201373,
"grad_norm": 0.4194313669939143,
"learning_rate": 3.252155936144598e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2913791835308075,
"step": 3270,
"valid_targets_mean": 4450.8,
"valid_targets_min": 802
},
{
"epoch": 2.498093058733791,
"grad_norm": 1.2583919640663648,
"learning_rate": 3.249187588054158e-05,
"loss": 0.4749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5555517673492432,
"step": 3275,
"valid_targets_mean": 802.0,
"valid_targets_min": 573
},
{
"epoch": 2.501906941266209,
"grad_norm": 0.4182243002509812,
"learning_rate": 3.246214721275765e-05,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2573336064815521,
"step": 3280,
"valid_targets_mean": 4969.2,
"valid_targets_min": 1564
},
{
"epoch": 2.505720823798627,
"grad_norm": 0.45724501654045097,
"learning_rate": 3.2432373465631735e-05,
"loss": 0.3116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3165568709373474,
"step": 3285,
"valid_targets_mean": 4297.0,
"valid_targets_min": 514
},
{
"epoch": 2.509534706331045,
"grad_norm": 0.5092081567329626,
"learning_rate": 3.240255474686445e-05,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3316061198711395,
"step": 3290,
"valid_targets_mean": 3906.4,
"valid_targets_min": 312
},
{
"epoch": 2.513348588863463,
"grad_norm": 0.4128558996686412,
"learning_rate": 3.23726911643191e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3001715838909149,
"step": 3295,
"valid_targets_mean": 4967.5,
"valid_targets_min": 1778
},
{
"epoch": 2.517162471395881,
"grad_norm": 0.3938186280656715,
"learning_rate": 3.234278282602124e-05,
"loss": 0.3114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2615433633327484,
"step": 3300,
"valid_targets_mean": 5320.2,
"valid_targets_min": 1049
},
{
"epoch": 2.520976353928299,
"grad_norm": 0.4720418563543762,
"learning_rate": 3.231282984015835e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33653369545936584,
"step": 3305,
"valid_targets_mean": 4016.5,
"valid_targets_min": 296
},
{
"epoch": 2.524790236460717,
"grad_norm": 0.4267496748398417,
"learning_rate": 3.228283231507942e-05,
"loss": 0.3148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33910393714904785,
"step": 3310,
"valid_targets_mean": 4726.3,
"valid_targets_min": 964
},
{
"epoch": 2.528604118993135,
"grad_norm": 0.4311391044080387,
"learning_rate": 3.225279035929452e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2865217924118042,
"step": 3315,
"valid_targets_mean": 4205.9,
"valid_targets_min": 1404
},
{
"epoch": 2.532418001525553,
"grad_norm": 0.43520655150199683,
"learning_rate": 3.222270408147447e-05,
"loss": 0.3165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3108452558517456,
"step": 3320,
"valid_targets_mean": 3981.0,
"valid_targets_min": 1039
},
{
"epoch": 2.536231884057971,
"grad_norm": 0.41681559543008706,
"learning_rate": 3.219257359045039e-05,
"loss": 0.2954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192494213581085,
"step": 3325,
"valid_targets_mean": 4327.1,
"valid_targets_min": 1317
},
{
"epoch": 2.540045766590389,
"grad_norm": 0.4184490891131059,
"learning_rate": 3.2162398995213355e-05,
"loss": 0.3132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3283292353153229,
"step": 3330,
"valid_targets_mean": 4665.3,
"valid_targets_min": 1543
},
{
"epoch": 2.543859649122807,
"grad_norm": 0.4100215088411221,
"learning_rate": 3.213218040491397e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32542848587036133,
"step": 3335,
"valid_targets_mean": 5202.1,
"valid_targets_min": 1795
},
{
"epoch": 2.5476735316552253,
"grad_norm": 0.4581780551039809,
"learning_rate": 3.2101917928861986e-05,
"loss": 0.3327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3427410423755646,
"step": 3340,
"valid_targets_mean": 4036.1,
"valid_targets_min": 729
},
{
"epoch": 2.551487414187643,
"grad_norm": 0.46035481912473103,
"learning_rate": 3.207161167652589e-05,
"loss": 0.3126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3007487952709198,
"step": 3345,
"valid_targets_mean": 4143.8,
"valid_targets_min": 894
},
{
"epoch": 2.555301296720061,
"grad_norm": 0.4034052276373605,
"learning_rate": 3.204126175753253e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30226239562034607,
"step": 3350,
"valid_targets_mean": 4929.1,
"valid_targets_min": 859
},
{
"epoch": 2.559115179252479,
"grad_norm": 0.45042067980684486,
"learning_rate": 3.201086828166672e-05,
"loss": 0.313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30956992506980896,
"step": 3355,
"valid_targets_mean": 3947.8,
"valid_targets_min": 300
},
{
"epoch": 2.5629290617848968,
"grad_norm": 0.4208797502147041,
"learning_rate": 3.1980431358870805e-05,
"loss": 0.3331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3373583257198334,
"step": 3360,
"valid_targets_mean": 5164.8,
"valid_targets_min": 1035
},
{
"epoch": 2.566742944317315,
"grad_norm": 0.4139965067629496,
"learning_rate": 3.1949951099244326e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26954910159111023,
"step": 3365,
"valid_targets_mean": 4530.2,
"valid_targets_min": 1172
},
{
"epoch": 2.570556826849733,
"grad_norm": 0.4073002785523478,
"learning_rate": 3.191942761304355e-05,
"loss": 0.3225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2845797538757324,
"step": 3370,
"valid_targets_mean": 5883.5,
"valid_targets_min": 1762
},
{
"epoch": 2.5743707093821513,
"grad_norm": 0.5005794736670965,
"learning_rate": 3.188886101068113e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33116093277931213,
"step": 3375,
"valid_targets_mean": 3936.8,
"valid_targets_min": 972
},
{
"epoch": 2.578184591914569,
"grad_norm": 0.39563461531335153,
"learning_rate": 3.185825140272569e-05,
"loss": 0.3134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31638863682746887,
"step": 3380,
"valid_targets_mean": 5078.9,
"valid_targets_min": 946
},
{
"epoch": 2.581998474446987,
"grad_norm": 0.38103153537461776,
"learning_rate": 3.1827598899901384e-05,
"loss": 0.3197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32187706232070923,
"step": 3385,
"valid_targets_mean": 5218.0,
"valid_targets_min": 1187
},
{
"epoch": 2.585812356979405,
"grad_norm": 0.4592422549331716,
"learning_rate": 3.179690361308757e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3470957279205322,
"step": 3390,
"valid_targets_mean": 4527.9,
"valid_targets_min": 498
},
{
"epoch": 2.589626239511823,
"grad_norm": 0.4242232229533466,
"learning_rate": 3.1766165653318354e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3074164390563965,
"step": 3395,
"valid_targets_mean": 4345.0,
"valid_targets_min": 933
},
{
"epoch": 2.593440122044241,
"grad_norm": 0.4249779377292946,
"learning_rate": 3.173538513178218e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2875068187713623,
"step": 3400,
"valid_targets_mean": 4543.5,
"valid_targets_min": 1172
},
{
"epoch": 2.597254004576659,
"grad_norm": 0.4274365869571573,
"learning_rate": 3.170456215982149e-05,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30450737476348877,
"step": 3405,
"valid_targets_mean": 4374.2,
"valid_targets_min": 1202
},
{
"epoch": 2.601067887109077,
"grad_norm": 0.45198819209554214,
"learning_rate": 3.167369684893224e-05,
"loss": 0.3193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29094013571739197,
"step": 3410,
"valid_targets_mean": 4171.3,
"valid_targets_min": 607
},
{
"epoch": 2.604881769641495,
"grad_norm": 0.3965480485903044,
"learning_rate": 3.164278931076358e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2770211398601532,
"step": 3415,
"valid_targets_mean": 5058.5,
"valid_targets_min": 1084
},
{
"epoch": 2.608695652173913,
"grad_norm": 0.545185315512466,
"learning_rate": 3.161183965711738e-05,
"loss": 0.2983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3102641701698303,
"step": 3420,
"valid_targets_mean": 2958.9,
"valid_targets_min": 526
},
{
"epoch": 2.612509534706331,
"grad_norm": 0.4525570772787872,
"learning_rate": 3.158084799994787e-05,
"loss": 0.3095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27811145782470703,
"step": 3425,
"valid_targets_mean": 4219.3,
"valid_targets_min": 1192
},
{
"epoch": 2.616323417238749,
"grad_norm": 0.4151885367952925,
"learning_rate": 3.154981445136121e-05,
"loss": 0.3081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30080297589302063,
"step": 3430,
"valid_targets_mean": 4943.1,
"valid_targets_min": 1128
},
{
"epoch": 2.620137299771167,
"grad_norm": 0.4653213080790013,
"learning_rate": 3.15187391236151e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3620241582393646,
"step": 3435,
"valid_targets_mean": 4422.7,
"valid_targets_min": 1005
},
{
"epoch": 2.623951182303585,
"grad_norm": 1.4191783668873799,
"learning_rate": 3.148762212911837e-05,
"loss": 0.4368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6156240105628967,
"step": 3440,
"valid_targets_mean": 883.6,
"valid_targets_min": 580
},
{
"epoch": 2.627765064836003,
"grad_norm": 0.48590288960795086,
"learning_rate": 3.145646358043055e-05,
"loss": 0.4271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34322547912597656,
"step": 3445,
"valid_targets_mean": 4622.9,
"valid_targets_min": 812
},
{
"epoch": 2.6315789473684212,
"grad_norm": 0.4771826596173598,
"learning_rate": 3.1425263590261514e-05,
"loss": 0.2979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32992804050445557,
"step": 3450,
"valid_targets_mean": 4304.2,
"valid_targets_min": 883
},
{
"epoch": 2.635392829900839,
"grad_norm": 1.5209723851975487,
"learning_rate": 3.139402227147103e-05,
"loss": 0.3126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33348479866981506,
"step": 3455,
"valid_targets_mean": 4633.4,
"valid_targets_min": 465
},
{
"epoch": 2.639206712433257,
"grad_norm": 0.5310761075855137,
"learning_rate": 3.136273973706835e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2709449231624603,
"step": 3460,
"valid_targets_mean": 3417.8,
"valid_targets_min": 1029
},
{
"epoch": 2.643020594965675,
"grad_norm": 0.43586930927383066,
"learning_rate": 3.133141610021184e-05,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2855277955532074,
"step": 3465,
"valid_targets_mean": 4236.7,
"valid_targets_min": 1145
},
{
"epoch": 2.646834477498093,
"grad_norm": 0.4567606109152964,
"learning_rate": 3.1300051474208524e-05,
"loss": 0.313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2981013059616089,
"step": 3470,
"valid_targets_mean": 4365.1,
"valid_targets_min": 1106
},
{
"epoch": 2.650648360030511,
"grad_norm": 0.40779512282622354,
"learning_rate": 3.126864597251371e-05,
"loss": 0.325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3078835904598236,
"step": 3475,
"valid_targets_mean": 5027.8,
"valid_targets_min": 1074
},
{
"epoch": 2.654462242562929,
"grad_norm": 0.4536802053876773,
"learning_rate": 3.123719970873057e-05,
"loss": 0.3153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3421435058116913,
"step": 3480,
"valid_targets_mean": 4348.9,
"valid_targets_min": 1020
},
{
"epoch": 2.6582761250953473,
"grad_norm": 0.45825952562012484,
"learning_rate": 3.120571279660971e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28770169615745544,
"step": 3485,
"valid_targets_mean": 3902.5,
"valid_targets_min": 1043
},
{
"epoch": 2.662090007627765,
"grad_norm": 0.47396470274603764,
"learning_rate": 3.1174185350048776e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27201271057128906,
"step": 3490,
"valid_targets_mean": 3508.6,
"valid_targets_min": 818
},
{
"epoch": 2.665903890160183,
"grad_norm": 0.42584203050280256,
"learning_rate": 3.114261748309205e-05,
"loss": 0.3035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2914293110370636,
"step": 3495,
"valid_targets_mean": 4368.4,
"valid_targets_min": 1077
},
{
"epoch": 2.669717772692601,
"grad_norm": 0.4556486758423126,
"learning_rate": 3.111100930993002e-05,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26826319098472595,
"step": 3500,
"valid_targets_mean": 3759.3,
"valid_targets_min": 862
},
{
"epoch": 2.6735316552250192,
"grad_norm": 0.4313304144373171,
"learning_rate": 3.107936094489897e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.337573379278183,
"step": 3505,
"valid_targets_mean": 4508.1,
"valid_targets_min": 1212
},
{
"epoch": 2.677345537757437,
"grad_norm": 0.503822426279713,
"learning_rate": 3.104767250248056e-05,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29460129141807556,
"step": 3510,
"valid_targets_mean": 3213.6,
"valid_targets_min": 1394
},
{
"epoch": 2.681159420289855,
"grad_norm": 0.443539023387382,
"learning_rate": 3.101594409730146e-05,
"loss": 0.3,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3758798837661743,
"step": 3515,
"valid_targets_mean": 5032.7,
"valid_targets_min": 854
},
{
"epoch": 2.6849733028222733,
"grad_norm": 0.41385413645152297,
"learning_rate": 3.098417584413286e-05,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24815471470355988,
"step": 3520,
"valid_targets_mean": 4305.5,
"valid_targets_min": 785
},
{
"epoch": 2.688787185354691,
"grad_norm": 0.46687358767596643,
"learning_rate": 3.0952367857890116e-05,
"loss": 0.2956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29929205775260925,
"step": 3525,
"valid_targets_mean": 3941.3,
"valid_targets_min": 472
},
{
"epoch": 2.692601067887109,
"grad_norm": 0.4396263260549913,
"learning_rate": 3.092052025363229e-05,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32522842288017273,
"step": 3530,
"valid_targets_mean": 4580.7,
"valid_targets_min": 1340
},
{
"epoch": 2.696414950419527,
"grad_norm": 0.4680531415671467,
"learning_rate": 3.0888633146561756e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3260200023651123,
"step": 3535,
"valid_targets_mean": 4359.8,
"valid_targets_min": 1293
},
{
"epoch": 2.700228832951945,
"grad_norm": 0.4542256878885209,
"learning_rate": 3.0856706652023806e-05,
"loss": 0.3007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30608275532722473,
"step": 3540,
"valid_targets_mean": 4218.7,
"valid_targets_min": 450
},
{
"epoch": 2.704042715484363,
"grad_norm": 0.545077179745613,
"learning_rate": 3.082474088550619e-05,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3118705749511719,
"step": 3545,
"valid_targets_mean": 3472.2,
"valid_targets_min": 417
},
{
"epoch": 2.707856598016781,
"grad_norm": 0.46674246079597687,
"learning_rate": 3.079273596263871e-05,
"loss": 0.3222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3758425712585449,
"step": 3550,
"valid_targets_mean": 4451.0,
"valid_targets_min": 875
},
{
"epoch": 2.7116704805491993,
"grad_norm": 0.4322217416895522,
"learning_rate": 3.0760691999192815e-05,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.267362117767334,
"step": 3555,
"valid_targets_mean": 4483.9,
"valid_targets_min": 300
},
{
"epoch": 2.7154843630816172,
"grad_norm": 0.45976089928354635,
"learning_rate": 3.072860911108119e-05,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29339703917503357,
"step": 3560,
"valid_targets_mean": 4354.7,
"valid_targets_min": 1286
},
{
"epoch": 2.719298245614035,
"grad_norm": 0.3995874661946734,
"learning_rate": 3.06964874143573e-05,
"loss": 0.3123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29337623715400696,
"step": 3565,
"valid_targets_mean": 5228.0,
"valid_targets_min": 981
},
{
"epoch": 2.723112128146453,
"grad_norm": 0.4521775129579294,
"learning_rate": 3.0664327025214996e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29508697986602783,
"step": 3570,
"valid_targets_mean": 3820.0,
"valid_targets_min": 878
},
{
"epoch": 2.726926010678871,
"grad_norm": 0.4276913646473351,
"learning_rate": 3.063212805998812e-05,
"loss": 0.3085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3139476478099823,
"step": 3575,
"valid_targets_mean": 4368.1,
"valid_targets_min": 1600
},
{
"epoch": 2.730739893211289,
"grad_norm": 0.4514060342213421,
"learning_rate": 3.059989063515001e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3006206452846527,
"step": 3580,
"valid_targets_mean": 3854.9,
"valid_targets_min": 494
},
{
"epoch": 2.734553775743707,
"grad_norm": 0.4603411167652157,
"learning_rate": 3.056761486731316e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3349507749080658,
"step": 3585,
"valid_targets_mean": 4717.0,
"valid_targets_min": 1189
},
{
"epoch": 2.738367658276125,
"grad_norm": 0.44757870922058896,
"learning_rate": 3.053530087322874e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3137572705745697,
"step": 3590,
"valid_targets_mean": 4155.7,
"valid_targets_min": 1165
},
{
"epoch": 2.7421815408085433,
"grad_norm": 0.4427568139153059,
"learning_rate": 3.0502948769786206e-05,
"loss": 0.3196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34423160552978516,
"step": 3595,
"valid_targets_mean": 4736.5,
"valid_targets_min": 361
},
{
"epoch": 2.745995423340961,
"grad_norm": 0.427371158670119,
"learning_rate": 3.047055867401287e-05,
"loss": 0.3058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.270975798368454,
"step": 3600,
"valid_targets_mean": 4545.8,
"valid_targets_min": 1154
},
{
"epoch": 2.749809305873379,
"grad_norm": 1.452402046964983,
"learning_rate": 3.043813070307347e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5670013427734375,
"step": 3605,
"valid_targets_mean": 850.0,
"valid_targets_min": 591
},
{
"epoch": 2.753623188405797,
"grad_norm": 0.48169002835878383,
"learning_rate": 3.0405664974269738e-05,
"loss": 0.4169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3203207850456238,
"step": 3610,
"valid_targets_mean": 4759.4,
"valid_targets_min": 1427
},
{
"epoch": 2.757437070938215,
"grad_norm": 0.42776785443748766,
"learning_rate": 3.037316160504001e-05,
"loss": 0.3025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30834314227104187,
"step": 3615,
"valid_targets_mean": 4934.1,
"valid_targets_min": 1323
},
{
"epoch": 2.761250953470633,
"grad_norm": 0.4070539421650789,
"learning_rate": 3.0340620712958765e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30431488156318665,
"step": 3620,
"valid_targets_mean": 5120.2,
"valid_targets_min": 1434
},
{
"epoch": 2.765064836003051,
"grad_norm": 0.41518918429874707,
"learning_rate": 3.0308042415736215e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3664722442626953,
"step": 3625,
"valid_targets_mean": 5194.8,
"valid_targets_min": 1098
},
{
"epoch": 2.7688787185354693,
"grad_norm": 0.4102430332242187,
"learning_rate": 3.0275426831217883e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33445557951927185,
"step": 3630,
"valid_targets_mean": 5132.5,
"valid_targets_min": 1481
},
{
"epoch": 2.772692601067887,
"grad_norm": 0.4735233795742744,
"learning_rate": 3.024277407738416e-05,
"loss": 0.3099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2750890254974365,
"step": 3635,
"valid_targets_mean": 3928.4,
"valid_targets_min": 1393
},
{
"epoch": 2.776506483600305,
"grad_norm": 0.42393895318486075,
"learning_rate": 3.02100842723499e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33074259757995605,
"step": 3640,
"valid_targets_mean": 4961.6,
"valid_targets_min": 1262
},
{
"epoch": 2.780320366132723,
"grad_norm": 0.39335349576447576,
"learning_rate": 3.017735753436398e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31892308592796326,
"step": 3645,
"valid_targets_mean": 5054.6,
"valid_targets_min": 967
},
{
"epoch": 2.7841342486651413,
"grad_norm": 0.4374520203995769,
"learning_rate": 3.0144593981808863e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2934619188308716,
"step": 3650,
"valid_targets_mean": 4071.9,
"valid_targets_min": 1746
},
{
"epoch": 2.787948131197559,
"grad_norm": 0.41212055790255153,
"learning_rate": 3.0111793733200213e-05,
"loss": 0.2933,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28573447465896606,
"step": 3655,
"valid_targets_mean": 4861.4,
"valid_targets_min": 964
},
{
"epoch": 2.791762013729977,
"grad_norm": 0.4177575764120052,
"learning_rate": 3.0078956907186396e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2791755795478821,
"step": 3660,
"valid_targets_mean": 4278.7,
"valid_targets_min": 760
},
{
"epoch": 2.7955758962623953,
"grad_norm": 0.4328653362766987,
"learning_rate": 3.0046083622548115e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2922763526439667,
"step": 3665,
"valid_targets_mean": 4501.5,
"valid_targets_min": 1257
},
{
"epoch": 2.799389778794813,
"grad_norm": 0.4311685870770303,
"learning_rate": 3.0013173998197946e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3213293254375458,
"step": 3670,
"valid_targets_mean": 4659.9,
"valid_targets_min": 1254
},
{
"epoch": 2.803203661327231,
"grad_norm": 0.4739213958170537,
"learning_rate": 2.9980228153179913e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30476173758506775,
"step": 3675,
"valid_targets_mean": 4565.8,
"valid_targets_min": 1223
},
{
"epoch": 2.807017543859649,
"grad_norm": 0.4101207028641973,
"learning_rate": 2.9947246206669076e-05,
"loss": 0.3114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3138103783130646,
"step": 3680,
"valid_targets_mean": 4624.6,
"valid_targets_min": 1362
},
{
"epoch": 2.8108314263920673,
"grad_norm": 0.48502558987531175,
"learning_rate": 2.9914228277971062e-05,
"loss": 0.3113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3027869164943695,
"step": 3685,
"valid_targets_mean": 4354.0,
"valid_targets_min": 990
},
{
"epoch": 2.814645308924485,
"grad_norm": 0.4699784328853892,
"learning_rate": 2.988117448652168e-05,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28289732336997986,
"step": 3690,
"valid_targets_mean": 3449.4,
"valid_targets_min": 1076
},
{
"epoch": 2.818459191456903,
"grad_norm": 0.42719126112782174,
"learning_rate": 2.9848084951886447e-05,
"loss": 0.3072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29756590723991394,
"step": 3695,
"valid_targets_mean": 4744.5,
"valid_targets_min": 543
},
{
"epoch": 2.8222730739893214,
"grad_norm": 0.4756799163785362,
"learning_rate": 2.9814959793760185e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3334232270717621,
"step": 3700,
"valid_targets_mean": 4507.8,
"valid_targets_min": 1165
},
{
"epoch": 2.8260869565217392,
"grad_norm": 0.42435957538086944,
"learning_rate": 2.9781799131966575e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34517112374305725,
"step": 3705,
"valid_targets_mean": 5040.6,
"valid_targets_min": 1024
},
{
"epoch": 2.829900839054157,
"grad_norm": 0.4183943383548955,
"learning_rate": 2.974860308645772e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2884375751018524,
"step": 3710,
"valid_targets_mean": 4425.5,
"valid_targets_min": 1392
},
{
"epoch": 2.833714721586575,
"grad_norm": 0.45371760515340676,
"learning_rate": 2.9715371777313727e-05,
"loss": 0.3109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3239792287349701,
"step": 3715,
"valid_targets_mean": 4472.9,
"valid_targets_min": 842
},
{
"epoch": 2.837528604118993,
"grad_norm": 0.42123373483544757,
"learning_rate": 2.9682105324742246e-05,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30317559838294983,
"step": 3720,
"valid_targets_mean": 4990.8,
"valid_targets_min": 1136
},
{
"epoch": 2.841342486651411,
"grad_norm": 0.40908457717851815,
"learning_rate": 2.9648803849078062e-05,
"loss": 0.2994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2726430594921112,
"step": 3725,
"valid_targets_mean": 4901.2,
"valid_targets_min": 1492
},
{
"epoch": 2.845156369183829,
"grad_norm": 0.5131351131948333,
"learning_rate": 2.9615467470782658e-05,
"loss": 0.3129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32720550894737244,
"step": 3730,
"valid_targets_mean": 3929.0,
"valid_targets_min": 424
},
{
"epoch": 2.8489702517162474,
"grad_norm": 0.4560432871680669,
"learning_rate": 2.9582096310443753e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27139559388160706,
"step": 3735,
"valid_targets_mean": 3375.7,
"valid_targets_min": 554
},
{
"epoch": 2.8527841342486653,
"grad_norm": 0.464944255448322,
"learning_rate": 2.9548690488774883e-05,
"loss": 0.315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30860528349876404,
"step": 3740,
"valid_targets_mean": 4120.4,
"valid_targets_min": 848
},
{
"epoch": 2.856598016781083,
"grad_norm": 0.4357985611831835,
"learning_rate": 2.9515250126614988e-05,
"loss": 0.3049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2578648626804352,
"step": 3745,
"valid_targets_mean": 4417.2,
"valid_targets_min": 1523
},
{
"epoch": 2.860411899313501,
"grad_norm": 0.4555909983730694,
"learning_rate": 2.948177534492793e-05,
"loss": 0.3138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3738441467285156,
"step": 3750,
"valid_targets_mean": 5224.7,
"valid_targets_min": 1249
},
{
"epoch": 2.864225781845919,
"grad_norm": 0.4515471831618389,
"learning_rate": 2.944826626480208e-05,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27258816361427307,
"step": 3755,
"valid_targets_mean": 3902.9,
"valid_targets_min": 1391
},
{
"epoch": 2.8680396643783372,
"grad_norm": 0.4356700442556603,
"learning_rate": 2.9414723007449876e-05,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3169298768043518,
"step": 3760,
"valid_targets_mean": 4445.8,
"valid_targets_min": 1054
},
{
"epoch": 2.871853546910755,
"grad_norm": 0.4477854060376825,
"learning_rate": 2.938114569420739e-05,
"loss": 0.3186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3050214350223541,
"step": 3765,
"valid_targets_mean": 4350.8,
"valid_targets_min": 1397
},
{
"epoch": 2.875667429443173,
"grad_norm": 1.498343127858281,
"learning_rate": 2.934753444653389e-05,
"loss": 0.3958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5911208391189575,
"step": 3770,
"valid_targets_mean": 914.1,
"valid_targets_min": 588
},
{
"epoch": 2.8794813119755913,
"grad_norm": 0.46199008167543115,
"learning_rate": 2.9313889386011373e-05,
"loss": 0.4099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3243425786495209,
"step": 3775,
"valid_targets_mean": 4639.8,
"valid_targets_min": 1284
},
{
"epoch": 2.883295194508009,
"grad_norm": 0.443878665174957,
"learning_rate": 2.9280210634344172e-05,
"loss": 0.2982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30592426657676697,
"step": 3780,
"valid_targets_mean": 4357.5,
"valid_targets_min": 1020
},
{
"epoch": 2.887109077040427,
"grad_norm": 0.4237997285481469,
"learning_rate": 2.924649831335848e-05,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26578041911125183,
"step": 3785,
"valid_targets_mean": 4502.4,
"valid_targets_min": 1004
},
{
"epoch": 2.890922959572845,
"grad_norm": 0.4445408846354412,
"learning_rate": 2.9212752545001925e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3063945174217224,
"step": 3790,
"valid_targets_mean": 4339.8,
"valid_targets_min": 930
},
{
"epoch": 2.8947368421052633,
"grad_norm": 0.4220627608061861,
"learning_rate": 2.917897345134311e-05,
"loss": 0.3081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3011779487133026,
"step": 3795,
"valid_targets_mean": 4646.5,
"valid_targets_min": 1421
},
{
"epoch": 2.898550724637681,
"grad_norm": 0.4253729735024821,
"learning_rate": 2.9145161154571204e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31455233693122864,
"step": 3800,
"valid_targets_mean": 4599.2,
"valid_targets_min": 832
},
{
"epoch": 2.902364607170099,
"grad_norm": 0.4086984176466762,
"learning_rate": 2.9111315776995474e-05,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28731080889701843,
"step": 3805,
"valid_targets_mean": 4735.2,
"valid_targets_min": 826
},
{
"epoch": 2.9061784897025174,
"grad_norm": 0.4325378865974398,
"learning_rate": 2.907743744104485e-05,
"loss": 0.3131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2914287745952606,
"step": 3810,
"valid_targets_mean": 4252.8,
"valid_targets_min": 1127
},
{
"epoch": 2.9099923722349352,
"grad_norm": 0.4750481419343565,
"learning_rate": 2.9043526269267476e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.324870765209198,
"step": 3815,
"valid_targets_mean": 3894.4,
"valid_targets_min": 1215
},
{
"epoch": 2.913806254767353,
"grad_norm": 0.4681688455199492,
"learning_rate": 2.9009582384330285e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3059101402759552,
"step": 3820,
"valid_targets_mean": 4010.4,
"valid_targets_min": 481
},
{
"epoch": 2.917620137299771,
"grad_norm": 0.4279954633684007,
"learning_rate": 2.897560590901854e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3050711452960968,
"step": 3825,
"valid_targets_mean": 4967.6,
"valid_targets_min": 1270
},
{
"epoch": 2.9214340198321893,
"grad_norm": 0.4097007390277408,
"learning_rate": 2.894159696623539e-05,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2968205511569977,
"step": 3830,
"valid_targets_mean": 5721.0,
"valid_targets_min": 1628
},
{
"epoch": 2.925247902364607,
"grad_norm": 0.44134858980535835,
"learning_rate": 2.8907555679001422e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3263862133026123,
"step": 3835,
"valid_targets_mean": 4728.2,
"valid_targets_min": 1357
},
{
"epoch": 2.929061784897025,
"grad_norm": 0.4782226338188455,
"learning_rate": 2.8873482170454242e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3298240602016449,
"step": 3840,
"valid_targets_mean": 3894.2,
"valid_targets_min": 1206
},
{
"epoch": 2.9328756674294434,
"grad_norm": 0.4034262588335436,
"learning_rate": 2.8839376563847995e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2946132719516754,
"step": 3845,
"valid_targets_mean": 4810.2,
"valid_targets_min": 1163
},
{
"epoch": 2.9366895499618613,
"grad_norm": 0.45988183381124215,
"learning_rate": 2.880523898255293e-05,
"loss": 0.3111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35728612542152405,
"step": 3850,
"valid_targets_mean": 4159.2,
"valid_targets_min": 1360
},
{
"epoch": 2.940503432494279,
"grad_norm": 0.43358117533596885,
"learning_rate": 2.877106955005498e-05,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3028857111930847,
"step": 3855,
"valid_targets_mean": 4309.5,
"valid_targets_min": 387
},
{
"epoch": 2.944317315026697,
"grad_norm": 0.47832181313680316,
"learning_rate": 2.8736868389955268e-05,
"loss": 0.3081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3072889745235443,
"step": 3860,
"valid_targets_mean": 3768.3,
"valid_targets_min": 1367
},
{
"epoch": 2.948131197559115,
"grad_norm": 0.4028436185145172,
"learning_rate": 2.8702635625969695e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28554582595825195,
"step": 3865,
"valid_targets_mean": 4673.5,
"valid_targets_min": 1133
},
{
"epoch": 2.9519450800915332,
"grad_norm": 0.448691951998679,
"learning_rate": 2.8668371381928496e-05,
"loss": 0.2919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3088511526584625,
"step": 3870,
"valid_targets_mean": 4255.3,
"valid_targets_min": 927
},
{
"epoch": 2.955758962623951,
"grad_norm": 0.4163765087317686,
"learning_rate": 2.8634075781775763e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.292270690202713,
"step": 3875,
"valid_targets_mean": 4703.5,
"valid_targets_min": 1051
},
{
"epoch": 2.9595728451563694,
"grad_norm": 0.39036304470600586,
"learning_rate": 2.859974894956901e-05,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2601741850376129,
"step": 3880,
"valid_targets_mean": 4793.8,
"valid_targets_min": 833
},
{
"epoch": 2.9633867276887873,
"grad_norm": 0.42515271525416554,
"learning_rate": 2.8565391009478744e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3349475860595703,
"step": 3885,
"valid_targets_mean": 4686.7,
"valid_targets_min": 539
},
{
"epoch": 2.967200610221205,
"grad_norm": 0.4970234362822981,
"learning_rate": 2.8531002085787985e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32301023602485657,
"step": 3890,
"valid_targets_mean": 3944.5,
"valid_targets_min": 1142
},
{
"epoch": 2.971014492753623,
"grad_norm": 0.42196977157148824,
"learning_rate": 2.8496582302891824e-05,
"loss": 0.3109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27662238478660583,
"step": 3895,
"valid_targets_mean": 4858.2,
"valid_targets_min": 1367
},
{
"epoch": 2.974828375286041,
"grad_norm": 0.47386191834873953,
"learning_rate": 2.8462131785297003e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30710312724113464,
"step": 3900,
"valid_targets_mean": 4201.6,
"valid_targets_min": 1091
},
{
"epoch": 2.9786422578184593,
"grad_norm": 0.4299488991621925,
"learning_rate": 2.8427650657621414e-05,
"loss": 0.3092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34638655185699463,
"step": 3905,
"valid_targets_mean": 5343.2,
"valid_targets_min": 1217
},
{
"epoch": 2.982456140350877,
"grad_norm": 0.4249651616035499,
"learning_rate": 2.8393139044593687e-05,
"loss": 0.3048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2586444318294525,
"step": 3910,
"valid_targets_mean": 4284.1,
"valid_targets_min": 781
},
{
"epoch": 2.9862700228832955,
"grad_norm": 0.41092107449889226,
"learning_rate": 2.8358597071052737e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2768830955028534,
"step": 3915,
"valid_targets_mean": 4534.6,
"valid_targets_min": 487
},
{
"epoch": 2.9900839054157133,
"grad_norm": 0.47463601161870095,
"learning_rate": 2.8324024861947284e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30442145466804504,
"step": 3920,
"valid_targets_mean": 3462.0,
"valid_targets_min": 603
},
{
"epoch": 2.993897787948131,
"grad_norm": 0.4527064420033862,
"learning_rate": 2.828942254233543e-05,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34296974539756775,
"step": 3925,
"valid_targets_mean": 4257.3,
"valid_targets_min": 775
},
{
"epoch": 2.997711670480549,
"grad_norm": 1.5493618786931598,
"learning_rate": 2.825479023738419e-05,
"loss": 0.3772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6141933798789978,
"step": 3930,
"valid_targets_mean": 912.7,
"valid_targets_min": 582
},
{
"epoch": 3.0015255530129674,
"grad_norm": 0.48310757043244024,
"learning_rate": 2.822012807236905e-05,
"loss": 0.4621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2655656039714813,
"step": 3935,
"valid_targets_mean": 4215.5,
"valid_targets_min": 1273
},
{
"epoch": 3.0053394355453853,
"grad_norm": 0.5201274345684972,
"learning_rate": 2.8185436172673505e-05,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.290056049823761,
"step": 3940,
"valid_targets_mean": 3994.8,
"valid_targets_min": 391
},
{
"epoch": 3.009153318077803,
"grad_norm": 0.4900178443387472,
"learning_rate": 2.8150714663788607e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2928362786769867,
"step": 3945,
"valid_targets_mean": 3524.9,
"valid_targets_min": 778
},
{
"epoch": 3.012967200610221,
"grad_norm": 0.4611566543168008,
"learning_rate": 2.8115963671312522e-05,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2869776785373688,
"step": 3950,
"valid_targets_mean": 4752.8,
"valid_targets_min": 1034
},
{
"epoch": 3.0167810831426394,
"grad_norm": 0.4220079332151452,
"learning_rate": 2.8081183320950062e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2875734269618988,
"step": 3955,
"valid_targets_mean": 4435.6,
"valid_targets_min": 477
},
{
"epoch": 3.0205949656750573,
"grad_norm": 0.43505589011064627,
"learning_rate": 2.804637373851223e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2964635193347931,
"step": 3960,
"valid_targets_mean": 5017.0,
"valid_targets_min": 859
},
{
"epoch": 3.024408848207475,
"grad_norm": 0.4392891751276722,
"learning_rate": 2.8011535049915787e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3092955946922302,
"step": 3965,
"valid_targets_mean": 4434.5,
"valid_targets_min": 1018
},
{
"epoch": 3.028222730739893,
"grad_norm": 0.4756626096657287,
"learning_rate": 2.7976667381182755e-05,
"loss": 0.3148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33730098605155945,
"step": 3970,
"valid_targets_mean": 4181.9,
"valid_targets_min": 1217
},
{
"epoch": 3.0320366132723113,
"grad_norm": 0.425272209059621,
"learning_rate": 2.7941770858440013e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.308401495218277,
"step": 3975,
"valid_targets_mean": 4507.3,
"valid_targets_min": 958
},
{
"epoch": 3.035850495804729,
"grad_norm": 0.47261764078577734,
"learning_rate": 2.7906845607918787e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3633866012096405,
"step": 3980,
"valid_targets_mean": 4527.0,
"valid_targets_min": 969
},
{
"epoch": 3.039664378337147,
"grad_norm": 0.45027923592941194,
"learning_rate": 2.7871891755954244e-05,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2875222861766815,
"step": 3985,
"valid_targets_mean": 4281.4,
"valid_targets_min": 834
},
{
"epoch": 3.0434782608695654,
"grad_norm": 0.42756509589119934,
"learning_rate": 2.7836909428984985e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3177221119403839,
"step": 3990,
"valid_targets_mean": 4449.5,
"valid_targets_min": 1005
},
{
"epoch": 3.0472921434019833,
"grad_norm": 0.4595474259293521,
"learning_rate": 2.7801898753552646e-05,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.304095596075058,
"step": 3995,
"valid_targets_mean": 4377.5,
"valid_targets_min": 325
},
{
"epoch": 3.051106025934401,
"grad_norm": 0.4259516268464371,
"learning_rate": 2.7766859856301383e-05,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192457854747772,
"step": 4000,
"valid_targets_mean": 4967.5,
"valid_targets_min": 933
},
{
"epoch": 3.054919908466819,
"grad_norm": 0.4444180247560326,
"learning_rate": 2.7731792863977444e-05,
"loss": 0.2954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2878134250640869,
"step": 4005,
"valid_targets_mean": 4432.8,
"valid_targets_min": 1049
},
{
"epoch": 3.0587337909992374,
"grad_norm": 0.4431622200695571,
"learning_rate": 2.7696697903428713e-05,
"loss": 0.3019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2699919044971466,
"step": 4010,
"valid_targets_mean": 4070.9,
"valid_targets_min": 1169
},
{
"epoch": 3.0625476735316552,
"grad_norm": 0.42489671707301224,
"learning_rate": 2.7661575101604232e-05,
"loss": 0.2992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29186615347862244,
"step": 4015,
"valid_targets_mean": 5442.9,
"valid_targets_min": 1401
},
{
"epoch": 3.066361556064073,
"grad_norm": 0.4245146413695337,
"learning_rate": 2.7626424585553767e-05,
"loss": 0.3123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.325810045003891,
"step": 4020,
"valid_targets_mean": 4809.8,
"valid_targets_min": 1066
},
{
"epoch": 3.0701754385964914,
"grad_norm": 0.3791123204554425,
"learning_rate": 2.7591246482427324e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24728161096572876,
"step": 4025,
"valid_targets_mean": 5028.0,
"valid_targets_min": 1443
},
{
"epoch": 3.0739893211289093,
"grad_norm": 0.43633981308469355,
"learning_rate": 2.7556040919474703e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3360931873321533,
"step": 4030,
"valid_targets_mean": 4940.6,
"valid_targets_min": 1513
},
{
"epoch": 3.077803203661327,
"grad_norm": 0.39657770661164027,
"learning_rate": 2.7520808024045023e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28438836336135864,
"step": 4035,
"valid_targets_mean": 4996.4,
"valid_targets_min": 1644
},
{
"epoch": 3.081617086193745,
"grad_norm": 0.45447668831956933,
"learning_rate": 2.748554792358631e-05,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27318766713142395,
"step": 4040,
"valid_targets_mean": 3740.3,
"valid_targets_min": 1075
},
{
"epoch": 3.0854309687261634,
"grad_norm": 0.4367756589898555,
"learning_rate": 2.745026074564495e-05,
"loss": 0.3164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3054395318031311,
"step": 4045,
"valid_targets_mean": 4505.4,
"valid_targets_min": 846
},
{
"epoch": 3.0892448512585813,
"grad_norm": 0.4223604121541854,
"learning_rate": 2.7414946617865314e-05,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2978456914424896,
"step": 4050,
"valid_targets_mean": 4903.7,
"valid_targets_min": 337
},
{
"epoch": 3.093058733790999,
"grad_norm": 0.43033237877389213,
"learning_rate": 2.737960566798924e-05,
"loss": 0.316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2762766480445862,
"step": 4055,
"valid_targets_mean": 4822.3,
"valid_targets_min": 1422
},
{
"epoch": 3.096872616323417,
"grad_norm": 0.40857330036886025,
"learning_rate": 2.7344238023855584e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27897074818611145,
"step": 4060,
"valid_targets_mean": 4889.1,
"valid_targets_min": 1257
},
{
"epoch": 3.1006864988558354,
"grad_norm": 0.452005688420249,
"learning_rate": 2.7308843813399786e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30446675419807434,
"step": 4065,
"valid_targets_mean": 4752.8,
"valid_targets_min": 223
},
{
"epoch": 3.1045003813882532,
"grad_norm": 0.4060532799872907,
"learning_rate": 2.7273423164653364e-05,
"loss": 0.2954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31288203597068787,
"step": 4070,
"valid_targets_mean": 4683.4,
"valid_targets_min": 1248
},
{
"epoch": 3.108314263920671,
"grad_norm": 0.4090987889175147,
"learning_rate": 2.7237976205743483e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30633795261383057,
"step": 4075,
"valid_targets_mean": 4901.8,
"valid_targets_min": 1770
},
{
"epoch": 3.1121281464530894,
"grad_norm": 0.43929196666659526,
"learning_rate": 2.7202503064892472e-05,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2629685401916504,
"step": 4080,
"valid_targets_mean": 4338.1,
"valid_targets_min": 382
},
{
"epoch": 3.1159420289855073,
"grad_norm": 0.43667857011990463,
"learning_rate": 2.7167003870417373e-05,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2743583619594574,
"step": 4085,
"valid_targets_mean": 3987.3,
"valid_targets_min": 936
},
{
"epoch": 3.119755911517925,
"grad_norm": 0.432006100221033,
"learning_rate": 2.7131478750729478e-05,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3109601140022278,
"step": 4090,
"valid_targets_mean": 4254.5,
"valid_targets_min": 1019
},
{
"epoch": 3.123569794050343,
"grad_norm": 1.52971297266124,
"learning_rate": 2.709592783433384e-05,
"loss": 0.4114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5797714591026306,
"step": 4095,
"valid_targets_mean": 871.8,
"valid_targets_min": 612
},
{
"epoch": 3.1273836765827614,
"grad_norm": 0.48384704512411747,
"learning_rate": 2.706035124982884e-05,
"loss": 0.363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33182665705680847,
"step": 4100,
"valid_targets_mean": 4583.2,
"valid_targets_min": 989
},
{
"epoch": 3.1311975591151793,
"grad_norm": 0.4293633304827102,
"learning_rate": 2.70247491259057e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3025500178337097,
"step": 4105,
"valid_targets_mean": 5153.6,
"valid_targets_min": 1300
},
{
"epoch": 3.135011441647597,
"grad_norm": 0.4137531220478505,
"learning_rate": 2.6989121591348042e-05,
"loss": 0.3049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2954184114933014,
"step": 4110,
"valid_targets_mean": 4562.9,
"valid_targets_min": 1009
},
{
"epoch": 3.138825324180015,
"grad_norm": 0.44578706063633217,
"learning_rate": 2.695346877503138e-05,
"loss": 0.2964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28965505957603455,
"step": 4115,
"valid_targets_mean": 4348.2,
"valid_targets_min": 489
},
{
"epoch": 3.1426392067124334,
"grad_norm": 0.4231966599504782,
"learning_rate": 2.6917790805922712e-05,
"loss": 0.3074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3042294681072235,
"step": 4120,
"valid_targets_mean": 4731.0,
"valid_targets_min": 1170
},
{
"epoch": 3.1464530892448512,
"grad_norm": 0.4382111519022077,
"learning_rate": 2.6882087813079993e-05,
"loss": 0.3045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28395530581474304,
"step": 4125,
"valid_targets_mean": 4604.8,
"valid_targets_min": 1536
},
{
"epoch": 3.150266971777269,
"grad_norm": 0.41220279417697464,
"learning_rate": 2.684635992565172e-05,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2971174418926239,
"step": 4130,
"valid_targets_mean": 4894.4,
"valid_targets_min": 1206
},
{
"epoch": 3.1540808543096874,
"grad_norm": 0.5066318014346421,
"learning_rate": 2.6810607272876407e-05,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28627005219459534,
"step": 4135,
"valid_targets_mean": 3675.4,
"valid_targets_min": 1096
},
{
"epoch": 3.1578947368421053,
"grad_norm": 0.42053061864748154,
"learning_rate": 2.677482998408219e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23367096483707428,
"step": 4140,
"valid_targets_mean": 4173.1,
"valid_targets_min": 1378
},
{
"epoch": 3.161708619374523,
"grad_norm": 0.4314063513504651,
"learning_rate": 2.67390281886863e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894207239151001,
"step": 4145,
"valid_targets_mean": 4910.4,
"valid_targets_min": 1027
},
{
"epoch": 3.165522501906941,
"grad_norm": 0.39830842433372293,
"learning_rate": 2.6703202016194617e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2879965305328369,
"step": 4150,
"valid_targets_mean": 4634.0,
"valid_targets_min": 353
},
{
"epoch": 3.1693363844393594,
"grad_norm": 0.43997400948287896,
"learning_rate": 2.6667351596201207e-05,
"loss": 0.3169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28813639283180237,
"step": 4155,
"valid_targets_mean": 4294.4,
"valid_targets_min": 841
},
{
"epoch": 3.1731502669717773,
"grad_norm": 0.43562273667182827,
"learning_rate": 2.6631477058387836e-05,
"loss": 0.2753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26361653208732605,
"step": 4160,
"valid_targets_mean": 4073.6,
"valid_targets_min": 448
},
{
"epoch": 3.176964149504195,
"grad_norm": 0.4022019133128142,
"learning_rate": 2.659557853252353e-05,
"loss": 0.2947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2975803017616272,
"step": 4165,
"valid_targets_mean": 5350.9,
"valid_targets_min": 1290
},
{
"epoch": 3.1807780320366135,
"grad_norm": 0.41775729801028555,
"learning_rate": 2.6559656148464065e-05,
"loss": 0.3094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31065797805786133,
"step": 4170,
"valid_targets_mean": 4931.3,
"valid_targets_min": 1049
},
{
"epoch": 3.1845919145690313,
"grad_norm": 0.42340874498162046,
"learning_rate": 2.6523710036151538e-05,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28241145610809326,
"step": 4175,
"valid_targets_mean": 4305.8,
"valid_targets_min": 747
},
{
"epoch": 3.1884057971014492,
"grad_norm": 0.4206928272872279,
"learning_rate": 2.648774032561386e-05,
"loss": 0.2977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.308231920003891,
"step": 4180,
"valid_targets_mean": 5015.2,
"valid_targets_min": 962
},
{
"epoch": 3.192219679633867,
"grad_norm": 0.46998455382582077,
"learning_rate": 2.6451747146964324e-05,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3151862919330597,
"step": 4185,
"valid_targets_mean": 4189.7,
"valid_targets_min": 895
},
{
"epoch": 3.1960335621662854,
"grad_norm": 0.44181960848776786,
"learning_rate": 2.6415730630401094e-05,
"loss": 0.2957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3007621765136719,
"step": 4190,
"valid_targets_mean": 4348.0,
"valid_targets_min": 1047
},
{
"epoch": 3.1998474446987033,
"grad_norm": 0.3832339742293115,
"learning_rate": 2.6379690906206774e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31467732787132263,
"step": 4195,
"valid_targets_mean": 5705.5,
"valid_targets_min": 1138
},
{
"epoch": 3.203661327231121,
"grad_norm": 0.392229055026644,
"learning_rate": 2.63436281047479e-05,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.293388694524765,
"step": 4200,
"valid_targets_mean": 5568.1,
"valid_targets_min": 1459
},
{
"epoch": 3.2074752097635395,
"grad_norm": 0.5283415619583283,
"learning_rate": 2.630754235647449e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3029252588748932,
"step": 4205,
"valid_targets_mean": 4410.8,
"valid_targets_min": 1391
},
{
"epoch": 3.2112890922959574,
"grad_norm": 0.4094720780562837,
"learning_rate": 2.6271433791919574e-05,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3849099576473236,
"step": 4210,
"valid_targets_mean": 6173.7,
"valid_targets_min": 1324
},
{
"epoch": 3.2151029748283753,
"grad_norm": 0.43046488665942784,
"learning_rate": 2.6235302541698717e-05,
"loss": 0.2918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30120354890823364,
"step": 4215,
"valid_targets_mean": 4579.4,
"valid_targets_min": 1042
},
{
"epoch": 3.218916857360793,
"grad_norm": 0.4789181271781151,
"learning_rate": 2.6199148736509533e-05,
"loss": 0.3147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3252256512641907,
"step": 4220,
"valid_targets_mean": 4278.8,
"valid_targets_min": 1484
},
{
"epoch": 3.2227307398932115,
"grad_norm": 0.43690382548291334,
"learning_rate": 2.6162972507131233e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2524643540382385,
"step": 4225,
"valid_targets_mean": 3789.8,
"valid_targets_min": 850
},
{
"epoch": 3.2265446224256293,
"grad_norm": 0.4008308182938237,
"learning_rate": 2.6126773984424136e-05,
"loss": 0.3296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3713483512401581,
"step": 4230,
"valid_targets_mean": 6207.3,
"valid_targets_min": 1052
},
{
"epoch": 3.230358504958047,
"grad_norm": 0.41774399379354676,
"learning_rate": 2.6090553299329208e-05,
"loss": 0.3051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27272287011146545,
"step": 4235,
"valid_targets_mean": 4272.5,
"valid_targets_min": 279
},
{
"epoch": 3.234172387490465,
"grad_norm": 0.4093732314062262,
"learning_rate": 2.605431058286759e-05,
"loss": 0.2988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3073391020298004,
"step": 4240,
"valid_targets_mean": 4975.9,
"valid_targets_min": 706
},
{
"epoch": 3.2379862700228834,
"grad_norm": 0.47298284841603055,
"learning_rate": 2.6018045966140105e-05,
"loss": 0.2968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3122836649417877,
"step": 4245,
"valid_targets_mean": 4119.1,
"valid_targets_min": 291
},
{
"epoch": 3.2418001525553013,
"grad_norm": 0.40428395385460597,
"learning_rate": 2.5981759580326796e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3531065285205841,
"step": 4250,
"valid_targets_mean": 6081.3,
"valid_targets_min": 1442
},
{
"epoch": 3.245614035087719,
"grad_norm": 0.4346135876532143,
"learning_rate": 2.594545155668646e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.284991055727005,
"step": 4255,
"valid_targets_mean": 4164.0,
"valid_targets_min": 1551
},
{
"epoch": 3.2494279176201375,
"grad_norm": 1.295013445237469,
"learning_rate": 2.5909122026556156e-05,
"loss": 0.4469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5561190843582153,
"step": 4260,
"valid_targets_mean": 887.6,
"valid_targets_min": 564
},
{
"epoch": 3.2532418001525554,
"grad_norm": 0.5633888295443477,
"learning_rate": 2.5872771121350746e-05,
"loss": 0.4165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32503604888916016,
"step": 4265,
"valid_targets_mean": 3850.0,
"valid_targets_min": 1141
},
{
"epoch": 3.2570556826849733,
"grad_norm": 0.5281593372478045,
"learning_rate": 2.583639897256241e-05,
"loss": 0.3148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3609069883823395,
"step": 4270,
"valid_targets_mean": 4185.0,
"valid_targets_min": 1144
},
{
"epoch": 3.260869565217391,
"grad_norm": 0.4891379681010717,
"learning_rate": 2.580000571176017e-05,
"loss": 0.2832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29750365018844604,
"step": 4275,
"valid_targets_mean": 3510.4,
"valid_targets_min": 1197
},
{
"epoch": 3.2646834477498095,
"grad_norm": 0.43956221026432685,
"learning_rate": 2.5763591470589412e-05,
"loss": 0.3188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3253210783004761,
"step": 4280,
"valid_targets_mean": 4749.8,
"valid_targets_min": 1060
},
{
"epoch": 3.2684973302822273,
"grad_norm": 0.46292002185303716,
"learning_rate": 2.572715638077142e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33239755034446716,
"step": 4285,
"valid_targets_mean": 4043.5,
"valid_targets_min": 1669
},
{
"epoch": 3.272311212814645,
"grad_norm": 0.5074495934712384,
"learning_rate": 2.569070057410291e-05,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32021841406822205,
"step": 4290,
"valid_targets_mean": 3380.5,
"valid_targets_min": 1275
},
{
"epoch": 3.276125095347063,
"grad_norm": 0.40410647442164166,
"learning_rate": 2.5654224182455503e-05,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25639939308166504,
"step": 4295,
"valid_targets_mean": 4476.0,
"valid_targets_min": 1255
},
{
"epoch": 3.2799389778794814,
"grad_norm": 0.4379359856829999,
"learning_rate": 2.5617727337775304e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.308867871761322,
"step": 4300,
"valid_targets_mean": 4687.6,
"valid_targets_min": 943
},
{
"epoch": 3.2837528604118993,
"grad_norm": 0.4635823928148595,
"learning_rate": 2.5581210172082403e-05,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24824810028076172,
"step": 4305,
"valid_targets_mean": 3754.1,
"valid_targets_min": 1090
},
{
"epoch": 3.287566742944317,
"grad_norm": 0.4683550105277778,
"learning_rate": 2.554467281747039e-05,
"loss": 0.289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28184881806373596,
"step": 4310,
"valid_targets_mean": 4163.5,
"valid_targets_min": 842
},
{
"epoch": 3.2913806254767355,
"grad_norm": 0.4915064273261867,
"learning_rate": 2.550811540610589e-05,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2834111750125885,
"step": 4315,
"valid_targets_mean": 3685.3,
"valid_targets_min": 552
},
{
"epoch": 3.2951945080091534,
"grad_norm": 0.3914255824084369,
"learning_rate": 2.5471538070228066e-05,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2567122280597687,
"step": 4320,
"valid_targets_mean": 5006.8,
"valid_targets_min": 757
},
{
"epoch": 3.2990083905415712,
"grad_norm": 0.472640247378806,
"learning_rate": 2.5434940942148183e-05,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3348356783390045,
"step": 4325,
"valid_targets_mean": 4366.6,
"valid_targets_min": 1039
},
{
"epoch": 3.302822273073989,
"grad_norm": 0.4923236156250513,
"learning_rate": 2.5398324154249063e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34193626046180725,
"step": 4330,
"valid_targets_mean": 3921.7,
"valid_targets_min": 1132
},
{
"epoch": 3.3066361556064074,
"grad_norm": 0.471692146824963,
"learning_rate": 2.5361687838984677e-05,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2816826403141022,
"step": 4335,
"valid_targets_mean": 3595.5,
"valid_targets_min": 1221
},
{
"epoch": 3.3104500381388253,
"grad_norm": 0.42190916943969575,
"learning_rate": 2.532503212887961e-05,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2746467888355255,
"step": 4340,
"valid_targets_mean": 4154.9,
"valid_targets_min": 347
},
{
"epoch": 3.314263920671243,
"grad_norm": 0.453882889428085,
"learning_rate": 2.5288357156528615e-05,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29759106040000916,
"step": 4345,
"valid_targets_mean": 4029.9,
"valid_targets_min": 1333
},
{
"epoch": 3.3180778032036615,
"grad_norm": 0.49862486651056076,
"learning_rate": 2.5251663054596115e-05,
"loss": 0.2935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28774699568748474,
"step": 4350,
"valid_targets_mean": 3458.5,
"valid_targets_min": 359
},
{
"epoch": 3.3218916857360794,
"grad_norm": 0.4382109576845958,
"learning_rate": 2.5214949955815744e-05,
"loss": 0.2815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.273575097322464,
"step": 4355,
"valid_targets_mean": 4762.6,
"valid_targets_min": 1560
},
{
"epoch": 3.3257055682684973,
"grad_norm": 0.3952193306320817,
"learning_rate": 2.517821799298983e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2989937365055084,
"step": 4360,
"valid_targets_mean": 4993.2,
"valid_targets_min": 1108
},
{
"epoch": 3.329519450800915,
"grad_norm": 0.4299063443043704,
"learning_rate": 2.5141467298988966e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28979429602622986,
"step": 4365,
"valid_targets_mean": 4497.9,
"valid_targets_min": 1254
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.4678185856388349,
"learning_rate": 2.5104698006751478e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2760257422924042,
"step": 4370,
"valid_targets_mean": 3716.8,
"valid_targets_min": 751
},
{
"epoch": 3.3371472158657514,
"grad_norm": 0.44293102220158903,
"learning_rate": 2.5067910249282977e-05,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28500014543533325,
"step": 4375,
"valid_targets_mean": 4523.8,
"valid_targets_min": 1655
},
{
"epoch": 3.3409610983981692,
"grad_norm": 0.5415466643652644,
"learning_rate": 2.503110415965587e-05,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2982900142669678,
"step": 4380,
"valid_targets_mean": 2946.4,
"valid_targets_min": 1071
},
{
"epoch": 3.3447749809305876,
"grad_norm": 0.44053774022930603,
"learning_rate": 2.4994279871008877e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2539463937282562,
"step": 4385,
"valid_targets_mean": 4374.5,
"valid_targets_min": 1125
},
{
"epoch": 3.3485888634630054,
"grad_norm": 0.44003841730672233,
"learning_rate": 2.4957437516546543e-05,
"loss": 0.2892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32349371910095215,
"step": 4390,
"valid_targets_mean": 4640.0,
"valid_targets_min": 919
},
{
"epoch": 3.3524027459954233,
"grad_norm": 0.4464447323916682,
"learning_rate": 2.4920577229538773e-05,
"loss": 0.2985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30756130814552307,
"step": 4395,
"valid_targets_mean": 4225.8,
"valid_targets_min": 1071
},
{
"epoch": 3.356216628527841,
"grad_norm": 0.4147797648169543,
"learning_rate": 2.4883699143320327e-05,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3059729039669037,
"step": 4400,
"valid_targets_mean": 4530.5,
"valid_targets_min": 1432
},
{
"epoch": 3.3600305110602595,
"grad_norm": 0.48324594985252733,
"learning_rate": 2.4846803391290362e-05,
"loss": 0.289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28423330187797546,
"step": 4405,
"valid_targets_mean": 4117.8,
"valid_targets_min": 689
},
{
"epoch": 3.3638443935926774,
"grad_norm": 0.39510207327738245,
"learning_rate": 2.480989010691192e-05,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29658064246177673,
"step": 4410,
"valid_targets_mean": 5399.8,
"valid_targets_min": 1256
},
{
"epoch": 3.3676582761250953,
"grad_norm": 0.42497343584852565,
"learning_rate": 2.4772959423711484e-05,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3150722086429596,
"step": 4415,
"valid_targets_mean": 4667.6,
"valid_targets_min": 958
},
{
"epoch": 3.3714721586575136,
"grad_norm": 0.47430966618042086,
"learning_rate": 2.4736011475278466e-05,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28610026836395264,
"step": 4420,
"valid_targets_mean": 4018.0,
"valid_targets_min": 525
},
{
"epoch": 3.3752860411899315,
"grad_norm": 1.3538687602475996,
"learning_rate": 2.4699046395264724e-05,
"loss": 0.4153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5354134440422058,
"step": 4425,
"valid_targets_mean": 843.5,
"valid_targets_min": 555
},
{
"epoch": 3.3790999237223494,
"grad_norm": 0.4434389928639025,
"learning_rate": 2.4662064317384093e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.321266770362854,
"step": 4430,
"valid_targets_mean": 5056.5,
"valid_targets_min": 590
},
{
"epoch": 3.3829138062547672,
"grad_norm": 0.4176548333395029,
"learning_rate": 2.4625065375411897e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2966906726360321,
"step": 4435,
"valid_targets_mean": 4763.8,
"valid_targets_min": 1576
},
{
"epoch": 3.386727688787185,
"grad_norm": 0.4832013590980464,
"learning_rate": 2.458804970318446e-05,
"loss": 0.304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32015255093574524,
"step": 4440,
"valid_targets_mean": 3990.1,
"valid_targets_min": 856
},
{
"epoch": 3.3905415713196034,
"grad_norm": 0.43037675012382226,
"learning_rate": 2.4551017434598618e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26767686009407043,
"step": 4445,
"valid_targets_mean": 4260.4,
"valid_targets_min": 395
},
{
"epoch": 3.3943554538520213,
"grad_norm": 0.4814709495318474,
"learning_rate": 2.4513968703611247e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2948641777038574,
"step": 4450,
"valid_targets_mean": 3419.1,
"valid_targets_min": 531
},
{
"epoch": 3.398169336384439,
"grad_norm": 0.44472165177178047,
"learning_rate": 2.4476903644238773e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28508543968200684,
"step": 4455,
"valid_targets_mean": 4292.3,
"valid_targets_min": 506
},
{
"epoch": 3.4019832189168575,
"grad_norm": 0.41201008799766403,
"learning_rate": 2.4439822390556683e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31197693943977356,
"step": 4460,
"valid_targets_mean": 5086.9,
"valid_targets_min": 906
},
{
"epoch": 3.4057971014492754,
"grad_norm": 0.454379940882493,
"learning_rate": 2.4402725076699058e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2770203649997711,
"step": 4465,
"valid_targets_mean": 4577.1,
"valid_targets_min": 997
},
{
"epoch": 3.4096109839816933,
"grad_norm": 0.527988293091776,
"learning_rate": 2.4365611836858045e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31560805439949036,
"step": 4470,
"valid_targets_mean": 4082.6,
"valid_targets_min": 545
},
{
"epoch": 3.413424866514111,
"grad_norm": 0.4064911273535986,
"learning_rate": 2.4328482805283425e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2556368410587311,
"step": 4475,
"valid_targets_mean": 4709.9,
"valid_targets_min": 1240
},
{
"epoch": 3.4172387490465295,
"grad_norm": 0.5843567476660677,
"learning_rate": 2.4291338116282095e-05,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2823584973812103,
"step": 4480,
"valid_targets_mean": 3790.3,
"valid_targets_min": 820
},
{
"epoch": 3.4210526315789473,
"grad_norm": 0.4567750258288281,
"learning_rate": 2.4254177904217584e-05,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.294177383184433,
"step": 4485,
"valid_targets_mean": 4076.5,
"valid_targets_min": 606
},
{
"epoch": 3.4248665141113652,
"grad_norm": 0.5011803624411254,
"learning_rate": 2.4217002303509585e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2771233022212982,
"step": 4490,
"valid_targets_mean": 3349.8,
"valid_targets_min": 1136
},
{
"epoch": 3.4286803966437835,
"grad_norm": 0.4659529424276567,
"learning_rate": 2.417981144863344e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3151896893978119,
"step": 4495,
"valid_targets_mean": 3970.9,
"valid_targets_min": 844
},
{
"epoch": 3.4324942791762014,
"grad_norm": 0.4365423762808735,
"learning_rate": 2.414260547411968e-05,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2706001102924347,
"step": 4500,
"valid_targets_mean": 4455.2,
"valid_targets_min": 949
},
{
"epoch": 3.4363081617086193,
"grad_norm": 0.41739904226755675,
"learning_rate": 2.4105384514553536e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2490123063325882,
"step": 4505,
"valid_targets_mean": 4767.6,
"valid_targets_min": 1047
},
{
"epoch": 3.440122044241037,
"grad_norm": 0.44840746198558895,
"learning_rate": 2.406814870457443e-05,
"loss": 0.2792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.279386430978775,
"step": 4510,
"valid_targets_mean": 4174.1,
"valid_targets_min": 571
},
{
"epoch": 3.4439359267734555,
"grad_norm": 0.4819890452945161,
"learning_rate": 2.4030898178875505e-05,
"loss": 0.2667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26938095688819885,
"step": 4515,
"valid_targets_mean": 3857.3,
"valid_targets_min": 414
},
{
"epoch": 3.4477498093058734,
"grad_norm": 0.44292361932334906,
"learning_rate": 2.399363307220314e-05,
"loss": 0.2881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2844865024089813,
"step": 4520,
"valid_targets_mean": 4402.6,
"valid_targets_min": 1365
},
{
"epoch": 3.4515636918382913,
"grad_norm": 0.46107216304175414,
"learning_rate": 2.3956353519356457e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33531391620635986,
"step": 4525,
"valid_targets_mean": 4102.7,
"valid_targets_min": 335
},
{
"epoch": 3.4553775743707096,
"grad_norm": 0.442565568837418,
"learning_rate": 2.3919059655186833e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26467326283454895,
"step": 4530,
"valid_targets_mean": 4285.3,
"valid_targets_min": 1265
},
{
"epoch": 3.4591914569031275,
"grad_norm": 0.4525205079659544,
"learning_rate": 2.388175161459741e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2614127993583679,
"step": 4535,
"valid_targets_mean": 4639.7,
"valid_targets_min": 896
},
{
"epoch": 3.4630053394355453,
"grad_norm": 0.4286446055548415,
"learning_rate": 2.384442953254262e-05,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31952324509620667,
"step": 4540,
"valid_targets_mean": 4769.8,
"valid_targets_min": 1221
},
{
"epoch": 3.466819221967963,
"grad_norm": 0.4394695100350723,
"learning_rate": 2.380709354402767e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3081350326538086,
"step": 4545,
"valid_targets_mean": 4902.0,
"valid_targets_min": 1328
},
{
"epoch": 3.4706331045003815,
"grad_norm": 0.44252990452185964,
"learning_rate": 2.3769743784108098e-05,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2925524413585663,
"step": 4550,
"valid_targets_mean": 4228.0,
"valid_targets_min": 282
},
{
"epoch": 3.4744469870327994,
"grad_norm": 0.43649847593552715,
"learning_rate": 2.3732380387889226e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29324600100517273,
"step": 4555,
"valid_targets_mean": 4716.2,
"valid_targets_min": 1282
},
{
"epoch": 3.4782608695652173,
"grad_norm": 0.5901540282708677,
"learning_rate": 2.369500349052573e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33937153220176697,
"step": 4560,
"valid_targets_mean": 6044.2,
"valid_targets_min": 1284
},
{
"epoch": 3.4820747520976356,
"grad_norm": 0.48142713655684205,
"learning_rate": 2.3657613227221102e-05,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2688189446926117,
"step": 4565,
"valid_targets_mean": 3629.0,
"valid_targets_min": 1103
},
{
"epoch": 3.4858886346300535,
"grad_norm": 0.4492333230953052,
"learning_rate": 2.3620209733227192e-05,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25333163142204285,
"step": 4570,
"valid_targets_mean": 3804.1,
"valid_targets_min": 887
},
{
"epoch": 3.4897025171624714,
"grad_norm": 0.476448139584302,
"learning_rate": 2.3582793143843716e-05,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2749543786048889,
"step": 4575,
"valid_targets_mean": 4068.4,
"valid_targets_min": 953
},
{
"epoch": 3.4935163996948893,
"grad_norm": 0.4359786993878809,
"learning_rate": 2.3545363594417743e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28557226061820984,
"step": 4580,
"valid_targets_mean": 4143.3,
"valid_targets_min": 1066
},
{
"epoch": 3.4973302822273076,
"grad_norm": 1.3429881064610008,
"learning_rate": 2.3507921220343248e-05,
"loss": 0.3855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5342379212379456,
"step": 4585,
"valid_targets_mean": 836.2,
"valid_targets_min": 603
},
{
"epoch": 3.5011441647597255,
"grad_norm": 0.5099271236627688,
"learning_rate": 2.347046615706057e-05,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2950020730495453,
"step": 4590,
"valid_targets_mean": 4808.9,
"valid_targets_min": 1261
},
{
"epoch": 3.5049580472921433,
"grad_norm": 0.45148904022167163,
"learning_rate": 2.3432998540055968e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26813894510269165,
"step": 4595,
"valid_targets_mean": 4466.8,
"valid_targets_min": 1142
},
{
"epoch": 3.5087719298245617,
"grad_norm": 0.48016054420587306,
"learning_rate": 2.3395518504861095e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31315457820892334,
"step": 4600,
"valid_targets_mean": 3756.8,
"valid_targets_min": 813
},
{
"epoch": 3.5125858123569795,
"grad_norm": 0.3827932809867314,
"learning_rate": 2.3358026187052536e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2498505562543869,
"step": 4605,
"valid_targets_mean": 5474.2,
"valid_targets_min": 1300
},
{
"epoch": 3.5163996948893974,
"grad_norm": 0.4885836440650446,
"learning_rate": 2.3320521722251308e-05,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3247798979282379,
"step": 4610,
"valid_targets_mean": 4359.9,
"valid_targets_min": 1083
},
{
"epoch": 3.5202135774218153,
"grad_norm": 0.4165894714535205,
"learning_rate": 2.328300524612236e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3320067822933197,
"step": 4615,
"valid_targets_mean": 5239.2,
"valid_targets_min": 1702
},
{
"epoch": 3.524027459954233,
"grad_norm": 0.39401369842550765,
"learning_rate": 2.3245476894374087e-05,
"loss": 0.2931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2737915515899658,
"step": 4620,
"valid_targets_mean": 5084.2,
"valid_targets_min": 1785
},
{
"epoch": 3.5278413424866515,
"grad_norm": 0.4594224574976198,
"learning_rate": 2.3207936802757844e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29349514842033386,
"step": 4625,
"valid_targets_mean": 4702.5,
"valid_targets_min": 1313
},
{
"epoch": 3.5316552250190694,
"grad_norm": 0.5133283887809664,
"learning_rate": 2.317038510706747e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30904343724250793,
"step": 4630,
"valid_targets_mean": 3583.6,
"valid_targets_min": 985
},
{
"epoch": 3.5354691075514877,
"grad_norm": 0.40462253402146175,
"learning_rate": 2.3132821943138756e-05,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26162537932395935,
"step": 4635,
"valid_targets_mean": 4592.1,
"valid_targets_min": 1251
},
{
"epoch": 3.5392829900839056,
"grad_norm": 0.4699941999637695,
"learning_rate": 2.3095247446848986e-05,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2771185338497162,
"step": 4640,
"valid_targets_mean": 4387.5,
"valid_targets_min": 1457
},
{
"epoch": 3.5430968726163234,
"grad_norm": 0.4482896520378407,
"learning_rate": 2.305766175411643e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26876458525657654,
"step": 4645,
"valid_targets_mean": 3782.0,
"valid_targets_min": 1088
},
{
"epoch": 3.5469107551487413,
"grad_norm": 0.46170532954154736,
"learning_rate": 2.302006500089988e-05,
"loss": 0.3081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3280665874481201,
"step": 4650,
"valid_targets_mean": 4604.7,
"valid_targets_min": 1161
},
{
"epoch": 3.550724637681159,
"grad_norm": 0.42087692641889823,
"learning_rate": 2.2982457323198104e-05,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2573760747909546,
"step": 4655,
"valid_targets_mean": 4632.5,
"valid_targets_min": 1194
},
{
"epoch": 3.5545385202135775,
"grad_norm": 0.4551534237796107,
"learning_rate": 2.2944838857049422e-05,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25980302691459656,
"step": 4660,
"valid_targets_mean": 4064.3,
"valid_targets_min": 338
},
{
"epoch": 3.5583524027459954,
"grad_norm": 0.39263337796345454,
"learning_rate": 2.2907209738531152e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3148830235004425,
"step": 4665,
"valid_targets_mean": 6088.7,
"valid_targets_min": 1367
},
{
"epoch": 3.5621662852784133,
"grad_norm": 0.5187964098178377,
"learning_rate": 2.2869570103759154e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31824734807014465,
"step": 4670,
"valid_targets_mean": 3209.6,
"valid_targets_min": 1198
},
{
"epoch": 3.5659801678108316,
"grad_norm": 0.39318418222353296,
"learning_rate": 2.283192008888734e-05,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2371831089258194,
"step": 4675,
"valid_targets_mean": 4917.4,
"valid_targets_min": 1111
},
{
"epoch": 3.5697940503432495,
"grad_norm": 0.47860026377836923,
"learning_rate": 2.279425983010716e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3355828821659088,
"step": 4680,
"valid_targets_mean": 4329.6,
"valid_targets_min": 288
},
{
"epoch": 3.5736079328756674,
"grad_norm": 0.47204126314129596,
"learning_rate": 2.2756589463647107e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3069976270198822,
"step": 4685,
"valid_targets_mean": 3892.1,
"valid_targets_min": 1071
},
{
"epoch": 3.5774218154080852,
"grad_norm": 0.44038100652623313,
"learning_rate": 2.2718909125772255e-05,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2812940776348114,
"step": 4690,
"valid_targets_mean": 4560.3,
"valid_targets_min": 1493
},
{
"epoch": 3.5812356979405036,
"grad_norm": 0.47684570252296454,
"learning_rate": 2.2681218952783745e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3217027485370636,
"step": 4695,
"valid_targets_mean": 3902.1,
"valid_targets_min": 1093
},
{
"epoch": 3.5850495804729214,
"grad_norm": 0.4562186549419339,
"learning_rate": 2.2643519081018284e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30921462178230286,
"step": 4700,
"valid_targets_mean": 4113.0,
"valid_targets_min": 1199
},
{
"epoch": 3.5888634630053393,
"grad_norm": 0.44993134293451825,
"learning_rate": 2.2605809646847675e-05,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672576606273651,
"step": 4705,
"valid_targets_mean": 4444.2,
"valid_targets_min": 312
},
{
"epoch": 3.5926773455377576,
"grad_norm": 0.5005018602677499,
"learning_rate": 2.2568090786678303e-05,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2609889507293701,
"step": 4710,
"valid_targets_mean": 3446.8,
"valid_targets_min": 957
},
{
"epoch": 3.5964912280701755,
"grad_norm": 0.4415676866527957,
"learning_rate": 2.2530362636950646e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27837008237838745,
"step": 4715,
"valid_targets_mean": 3975.3,
"valid_targets_min": 368
},
{
"epoch": 3.6003051106025934,
"grad_norm": 0.48156304179055964,
"learning_rate": 2.24926253341388e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.327156126499176,
"step": 4720,
"valid_targets_mean": 4176.2,
"valid_targets_min": 366
},
{
"epoch": 3.6041189931350113,
"grad_norm": 0.4360672584760495,
"learning_rate": 2.245487901474996e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2536308467388153,
"step": 4725,
"valid_targets_mean": 4185.0,
"valid_targets_min": 1214
},
{
"epoch": 3.6079328756674296,
"grad_norm": 0.40767628665247807,
"learning_rate": 2.2417123815323936e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2984670102596283,
"step": 4730,
"valid_targets_mean": 5542.7,
"valid_targets_min": 1423
},
{
"epoch": 3.6117467581998475,
"grad_norm": 0.45360199839129894,
"learning_rate": 2.2379359872432662e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2925918996334076,
"step": 4735,
"valid_targets_mean": 3912.8,
"valid_targets_min": 995
},
{
"epoch": 3.6155606407322654,
"grad_norm": 0.4946715128075741,
"learning_rate": 2.23415873226797e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30403146147727966,
"step": 4740,
"valid_targets_mean": 3816.2,
"valid_targets_min": 358
},
{
"epoch": 3.6193745232646837,
"grad_norm": 0.47406262208079786,
"learning_rate": 2.2303806302699744e-05,
"loss": 0.2746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2904681861400604,
"step": 4745,
"valid_targets_mean": 4019.7,
"valid_targets_min": 249
},
{
"epoch": 3.6231884057971016,
"grad_norm": 1.6624652115903416,
"learning_rate": 2.2266016949158128e-05,
"loss": 0.3583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5583869218826294,
"step": 4750,
"valid_targets_mean": 827.7,
"valid_targets_min": 481
},
{
"epoch": 3.6270022883295194,
"grad_norm": 0.504124880570195,
"learning_rate": 2.2228219398750332e-05,
"loss": 0.442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2691499590873718,
"step": 4755,
"valid_targets_mean": 4826.3,
"valid_targets_min": 1355
},
{
"epoch": 3.6308161708619373,
"grad_norm": 0.4936141065951774,
"learning_rate": 2.2190413788201494e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2698126435279846,
"step": 4760,
"valid_targets_mean": 3571.9,
"valid_targets_min": 1043
},
{
"epoch": 3.634630053394355,
"grad_norm": 0.4304446140565006,
"learning_rate": 2.2152600254265893e-05,
"loss": 0.2919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2709462642669678,
"step": 4765,
"valid_targets_mean": 4900.3,
"valid_targets_min": 1342
},
{
"epoch": 3.6384439359267735,
"grad_norm": 0.4034314385983401,
"learning_rate": 2.2114778933726478e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3143347203731537,
"step": 4770,
"valid_targets_mean": 5496.1,
"valid_targets_min": 803
},
{
"epoch": 3.6422578184591914,
"grad_norm": 0.43621856626978023,
"learning_rate": 2.2076949963394365e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2733272612094879,
"step": 4775,
"valid_targets_mean": 4515.8,
"valid_targets_min": 1413
},
{
"epoch": 3.6460717009916097,
"grad_norm": 0.8202631465156636,
"learning_rate": 2.2039113480108333e-05,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3054891526699066,
"step": 4780,
"valid_targets_mean": 5119.5,
"valid_targets_min": 1388
},
{
"epoch": 3.6498855835240276,
"grad_norm": 0.4873756601176684,
"learning_rate": 2.2001269620734354e-05,
"loss": 0.3033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3282296359539032,
"step": 4785,
"valid_targets_mean": 3815.8,
"valid_targets_min": 1194
},
{
"epoch": 3.6536994660564455,
"grad_norm": 0.4301975751639404,
"learning_rate": 2.1963418522165064e-05,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25355055928230286,
"step": 4790,
"valid_targets_mean": 4236.9,
"valid_targets_min": 757
},
{
"epoch": 3.6575133485888633,
"grad_norm": 0.502083577647879,
"learning_rate": 2.1925560321319292e-05,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2781239449977875,
"step": 4795,
"valid_targets_mean": 3783.9,
"valid_targets_min": 366
},
{
"epoch": 3.6613272311212812,
"grad_norm": 0.4455469454708054,
"learning_rate": 2.1887695155141565e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2768062651157379,
"step": 4800,
"valid_targets_mean": 4387.9,
"valid_targets_min": 437
},
{
"epoch": 3.6651411136536995,
"grad_norm": 0.43246638097368684,
"learning_rate": 2.1849823160601602e-05,
"loss": 0.2796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30090662837028503,
"step": 4805,
"valid_targets_mean": 4708.5,
"valid_targets_min": 996
},
{
"epoch": 3.6689549961861174,
"grad_norm": 0.48013536906608734,
"learning_rate": 2.1811944474693812e-05,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2882266342639923,
"step": 4810,
"valid_targets_mean": 3664.5,
"valid_targets_min": 1377
},
{
"epoch": 3.6727688787185357,
"grad_norm": 0.4215066962223358,
"learning_rate": 2.177405923443682e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31770798563957214,
"step": 4815,
"valid_targets_mean": 5157.8,
"valid_targets_min": 1195
},
{
"epoch": 3.6765827612509536,
"grad_norm": 0.4822129870662444,
"learning_rate": 2.173616757687296e-05,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2803454101085663,
"step": 4820,
"valid_targets_mean": 4487.2,
"valid_targets_min": 1171
},
{
"epoch": 3.6803966437833715,
"grad_norm": 0.4518314070729709,
"learning_rate": 2.1698269639067772e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30212217569351196,
"step": 4825,
"valid_targets_mean": 4547.0,
"valid_targets_min": 807
},
{
"epoch": 3.6842105263157894,
"grad_norm": 0.4381394067728647,
"learning_rate": 2.1660365558109522e-05,
"loss": 0.2878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2651013433933258,
"step": 4830,
"valid_targets_mean": 4092.2,
"valid_targets_min": 460
},
{
"epoch": 3.6880244088482073,
"grad_norm": 0.4611168188871333,
"learning_rate": 2.162245547110869e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28754758834838867,
"step": 4835,
"valid_targets_mean": 4108.5,
"valid_targets_min": 1266
},
{
"epoch": 3.6918382913806256,
"grad_norm": 0.4216410388557109,
"learning_rate": 2.1584539515197476e-05,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2530418336391449,
"step": 4840,
"valid_targets_mean": 4882.8,
"valid_targets_min": 1495
},
{
"epoch": 3.6956521739130435,
"grad_norm": 0.5101669538365097,
"learning_rate": 2.1546617827529337e-05,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2959820330142975,
"step": 4845,
"valid_targets_mean": 3875.6,
"valid_targets_min": 567
},
{
"epoch": 3.6994660564454613,
"grad_norm": 0.4422043707591292,
"learning_rate": 2.1508690545278438e-05,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25045129656791687,
"step": 4850,
"valid_targets_mean": 4307.8,
"valid_targets_min": 513
},
{
"epoch": 3.7032799389778797,
"grad_norm": 0.48074229488333253,
"learning_rate": 2.1470757805639186e-05,
"loss": 0.2832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2914007902145386,
"step": 4855,
"valid_targets_mean": 3635.8,
"valid_targets_min": 1182
},
{
"epoch": 3.7070938215102975,
"grad_norm": 0.4432598278262152,
"learning_rate": 2.1432819745825732e-05,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.247156023979187,
"step": 4860,
"valid_targets_mean": 4326.8,
"valid_targets_min": 1113
},
{
"epoch": 3.7109077040427154,
"grad_norm": 0.43543523339515255,
"learning_rate": 2.139487650307147e-05,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2991539537906647,
"step": 4865,
"valid_targets_mean": 4774.8,
"valid_targets_min": 1273
},
{
"epoch": 3.7147215865751333,
"grad_norm": 0.45320374074665914,
"learning_rate": 2.135692821462855e-05,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2640787661075592,
"step": 4870,
"valid_targets_mean": 3983.8,
"valid_targets_min": 1240
},
{
"epoch": 3.7185354691075516,
"grad_norm": 0.4730272978195686,
"learning_rate": 2.131897501776736e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2792348563671112,
"step": 4875,
"valid_targets_mean": 3923.6,
"valid_targets_min": 1350
},
{
"epoch": 3.7223493516399695,
"grad_norm": 0.46367011168212957,
"learning_rate": 2.128101704977605e-05,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26287421584129333,
"step": 4880,
"valid_targets_mean": 4225.2,
"valid_targets_min": 1065
},
{
"epoch": 3.7261632341723874,
"grad_norm": 0.45822132449926056,
"learning_rate": 2.124305444796003e-05,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26010265946388245,
"step": 4885,
"valid_targets_mean": 4470.3,
"valid_targets_min": 1450
},
{
"epoch": 3.7299771167048057,
"grad_norm": 0.4999416286074579,
"learning_rate": 2.1205087349641474e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28680503368377686,
"step": 4890,
"valid_targets_mean": 4674.3,
"valid_targets_min": 1425
},
{
"epoch": 3.7337909992372236,
"grad_norm": 1.1021522685950285,
"learning_rate": 2.116711589215882e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29555997252464294,
"step": 4895,
"valid_targets_mean": 4395.1,
"valid_targets_min": 1035
},
{
"epoch": 3.7376048817696415,
"grad_norm": 0.4704972599874909,
"learning_rate": 2.1129140212866268e-05,
"loss": 0.2792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2726249694824219,
"step": 4900,
"valid_targets_mean": 4035.6,
"valid_targets_min": 390
},
{
"epoch": 3.7414187643020593,
"grad_norm": 0.4895949033004227,
"learning_rate": 2.1091160449133294e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2875785231590271,
"step": 4905,
"valid_targets_mean": 3985.5,
"valid_targets_min": 1161
},
{
"epoch": 3.7452326468344777,
"grad_norm": 0.4732839023835256,
"learning_rate": 2.105317673834415e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3635139465332031,
"step": 4910,
"valid_targets_mean": 4737.2,
"valid_targets_min": 759
},
{
"epoch": 3.7490465293668955,
"grad_norm": 0.7329967738195239,
"learning_rate": 2.1015189217897364e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3502159118652344,
"step": 4915,
"valid_targets_mean": 2071.2,
"valid_targets_min": 576
},
{
"epoch": 3.7528604118993134,
"grad_norm": 0.5373102096273961,
"learning_rate": 2.097719802520524e-05,
"loss": 0.4261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26391589641571045,
"step": 4920,
"valid_targets_mean": 3376.4,
"valid_targets_min": 1296
},
{
"epoch": 3.7566742944317317,
"grad_norm": 0.5099941176506099,
"learning_rate": 2.0939203297693384e-05,
"loss": 0.2856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25710639357566833,
"step": 4925,
"valid_targets_mean": 3332.5,
"valid_targets_min": 1082
},
{
"epoch": 3.7604881769641496,
"grad_norm": 0.46162219390203724,
"learning_rate": 2.090120517280017e-05,
"loss": 0.2816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2861987054347992,
"step": 4930,
"valid_targets_mean": 4440.6,
"valid_targets_min": 440
},
{
"epoch": 3.7643020594965675,
"grad_norm": 0.4620294227163194,
"learning_rate": 2.086320378797626e-05,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29089245200157166,
"step": 4935,
"valid_targets_mean": 4926.2,
"valid_targets_min": 1360
},
{
"epoch": 3.7681159420289854,
"grad_norm": 0.46269226142521863,
"learning_rate": 2.0825199280684122e-05,
"loss": 0.3014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26844826340675354,
"step": 4940,
"valid_targets_mean": 4640.1,
"valid_targets_min": 1372
},
{
"epoch": 3.7719298245614032,
"grad_norm": 0.44918665856402457,
"learning_rate": 2.0787191788397503e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2886035144329071,
"step": 4945,
"valid_targets_mean": 4349.8,
"valid_targets_min": 1171
},
{
"epoch": 3.7757437070938216,
"grad_norm": 0.4611965587323673,
"learning_rate": 2.0749181448600967e-05,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3016029894351959,
"step": 4950,
"valid_targets_mean": 5051.3,
"valid_targets_min": 862
},
{
"epoch": 3.7795575896262394,
"grad_norm": 0.4769360159800852,
"learning_rate": 2.0711168398789364e-05,
"loss": 0.2796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.291471391916275,
"step": 4955,
"valid_targets_mean": 3710.4,
"valid_targets_min": 1152
},
{
"epoch": 3.7833714721586578,
"grad_norm": 0.41686170733711136,
"learning_rate": 2.0673152776467343e-05,
"loss": 0.2774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24968425929546356,
"step": 4960,
"valid_targets_mean": 4307.1,
"valid_targets_min": 845
},
{
"epoch": 3.7871853546910756,
"grad_norm": 0.388968051713768,
"learning_rate": 2.0635134719148873e-05,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2582361102104187,
"step": 4965,
"valid_targets_mean": 5233.7,
"valid_targets_min": 1220
},
{
"epoch": 3.7909992372234935,
"grad_norm": 0.4120063369566906,
"learning_rate": 2.0597114364356726e-05,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2593841552734375,
"step": 4970,
"valid_targets_mean": 4571.8,
"valid_targets_min": 1065
},
{
"epoch": 3.7948131197559114,
"grad_norm": 0.42356900591636804,
"learning_rate": 2.0559091849621985e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2937016785144806,
"step": 4975,
"valid_targets_mean": 5643.4,
"valid_targets_min": 1265
},
{
"epoch": 3.7986270022883293,
"grad_norm": 0.404415109624401,
"learning_rate": 2.0521067312483535e-05,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3042158782482147,
"step": 4980,
"valid_targets_mean": 5218.6,
"valid_targets_min": 559
},
{
"epoch": 3.8024408848207476,
"grad_norm": 0.4155431744232426,
"learning_rate": 2.048304089048759e-05,
"loss": 0.2617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21575789153575897,
"step": 4985,
"valid_targets_mean": 4188.2,
"valid_targets_min": 1059
},
{
"epoch": 3.8062547673531655,
"grad_norm": 0.46950574889200086,
"learning_rate": 2.044501272118718e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3153056502342224,
"step": 4990,
"valid_targets_mean": 3989.5,
"valid_targets_min": 581
},
{
"epoch": 3.8100686498855834,
"grad_norm": 0.43838438560538834,
"learning_rate": 2.0406982942141646e-05,
"loss": 0.2937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.291579931974411,
"step": 4995,
"valid_targets_mean": 4621.1,
"valid_targets_min": 1325
},
{
"epoch": 3.8138825324180017,
"grad_norm": 0.44145322237824836,
"learning_rate": 2.0368951690916166e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2182352989912033,
"step": 5000,
"valid_targets_mean": 4515.5,
"valid_targets_min": 1668
},
{
"epoch": 3.8176964149504196,
"grad_norm": 0.4504621882289278,
"learning_rate": 2.0330919105081238e-05,
"loss": 0.2846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3026907742023468,
"step": 5005,
"valid_targets_mean": 4372.3,
"valid_targets_min": 415
},
{
"epoch": 3.8215102974828374,
"grad_norm": 0.4929531534573359,
"learning_rate": 2.0292885322212183e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27263951301574707,
"step": 5010,
"valid_targets_mean": 4319.9,
"valid_targets_min": 1306
},
{
"epoch": 3.8253241800152553,
"grad_norm": 0.41575043508311943,
"learning_rate": 2.0254850479888652e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930053770542145,
"step": 5015,
"valid_targets_mean": 5146.0,
"valid_targets_min": 577
},
{
"epoch": 3.8291380625476736,
"grad_norm": 0.4801883312541542,
"learning_rate": 2.021681471569414e-05,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3446965515613556,
"step": 5020,
"valid_targets_mean": 4140.5,
"valid_targets_min": 1019
},
{
"epoch": 3.8329519450800915,
"grad_norm": 0.41216892152068585,
"learning_rate": 2.017877816721546e-05,
"loss": 0.2856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28163060545921326,
"step": 5025,
"valid_targets_mean": 4676.8,
"valid_targets_min": 400
},
{
"epoch": 3.8367658276125094,
"grad_norm": 0.4279433137988471,
"learning_rate": 2.0140740972042276e-05,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2602086365222931,
"step": 5030,
"valid_targets_mean": 4468.6,
"valid_targets_min": 1380
},
{
"epoch": 3.8405797101449277,
"grad_norm": 0.4665598041153684,
"learning_rate": 2.0102703267766584e-05,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.312650591135025,
"step": 5035,
"valid_targets_mean": 4409.3,
"valid_targets_min": 841
},
{
"epoch": 3.8443935926773456,
"grad_norm": 0.44786662715514164,
"learning_rate": 2.006466519198222e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23634012043476105,
"step": 5040,
"valid_targets_mean": 5063.6,
"valid_targets_min": 751
},
{
"epoch": 3.8482074752097635,
"grad_norm": 0.4974521996462959,
"learning_rate": 2.0026626882284365e-05,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2868984043598175,
"step": 5045,
"valid_targets_mean": 4401.0,
"valid_targets_min": 1068
},
{
"epoch": 3.8520213577421814,
"grad_norm": 0.4303348110695608,
"learning_rate": 1.998858847626906e-05,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2536643147468567,
"step": 5050,
"valid_targets_mean": 4594.3,
"valid_targets_min": 1286
},
{
"epoch": 3.8558352402745997,
"grad_norm": 0.4798918018206437,
"learning_rate": 1.995055011153267e-05,
"loss": 0.2961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28693172335624695,
"step": 5055,
"valid_targets_mean": 3978.6,
"valid_targets_min": 1294
},
{
"epoch": 3.8596491228070176,
"grad_norm": 0.5833198149859566,
"learning_rate": 1.9912511925671428e-05,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2774660289287567,
"step": 5060,
"valid_targets_mean": 4207.2,
"valid_targets_min": 1323
},
{
"epoch": 3.8634630053394354,
"grad_norm": 0.4438224992611823,
"learning_rate": 1.987447405628092e-05,
"loss": 0.3078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2594674825668335,
"step": 5065,
"valid_targets_mean": 5099.1,
"valid_targets_min": 1504
},
{
"epoch": 3.8672768878718538,
"grad_norm": 0.44237795466310065,
"learning_rate": 1.9836436640955578e-05,
"loss": 0.2686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26847514510154724,
"step": 5070,
"valid_targets_mean": 4456.6,
"valid_targets_min": 1314
},
{
"epoch": 3.8710907704042716,
"grad_norm": 0.43779853479233827,
"learning_rate": 1.9798399817288197e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27755558490753174,
"step": 5075,
"valid_targets_mean": 4562.6,
"valid_targets_min": 927
},
{
"epoch": 3.8749046529366895,
"grad_norm": 1.14893712269878,
"learning_rate": 1.976036372286943e-05,
"loss": 0.3154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41553497314453125,
"step": 5080,
"valid_targets_mean": 1294.0,
"valid_targets_min": 629
},
{
"epoch": 3.8787185354691074,
"grad_norm": 0.505426898880738,
"learning_rate": 1.972232849528729e-05,
"loss": 0.4263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2346818894147873,
"step": 5085,
"valid_targets_mean": 4294.2,
"valid_targets_min": 1401
},
{
"epoch": 3.8825324180015257,
"grad_norm": 0.44319385303652004,
"learning_rate": 1.9684294272126662e-05,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27154862880706787,
"step": 5090,
"valid_targets_mean": 4119.6,
"valid_targets_min": 1432
},
{
"epoch": 3.8863463005339436,
"grad_norm": 0.5459021377392329,
"learning_rate": 1.9646261190968787e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32108262181282043,
"step": 5095,
"valid_targets_mean": 4003.6,
"valid_targets_min": 957
},
{
"epoch": 3.8901601830663615,
"grad_norm": 0.42387804406963075,
"learning_rate": 1.9608229389390786e-05,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3090623915195465,
"step": 5100,
"valid_targets_mean": 4897.4,
"valid_targets_min": 2186
},
{
"epoch": 3.89397406559878,
"grad_norm": 0.49421705023909407,
"learning_rate": 1.9570199004965146e-05,
"loss": 0.2903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32566288113594055,
"step": 5105,
"valid_targets_mean": 4511.8,
"valid_targets_min": 1021
},
{
"epoch": 3.8977879481311977,
"grad_norm": 0.4668014379335834,
"learning_rate": 1.9532170175259225e-05,
"loss": 0.2797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2344411164522171,
"step": 5110,
"valid_targets_mean": 4368.4,
"valid_targets_min": 480
},
{
"epoch": 3.9016018306636155,
"grad_norm": 0.43277753403218727,
"learning_rate": 1.9494143037834778e-05,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30218103528022766,
"step": 5115,
"valid_targets_mean": 4824.0,
"valid_targets_min": 447
},
{
"epoch": 3.9054157131960334,
"grad_norm": 0.4156421333456064,
"learning_rate": 1.945611773024739e-05,
"loss": 0.2942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27466729283332825,
"step": 5120,
"valid_targets_mean": 4651.5,
"valid_targets_min": 1039
},
{
"epoch": 3.9092295957284513,
"grad_norm": 0.47060667981939347,
"learning_rate": 1.941809439004607e-05,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.269515722990036,
"step": 5125,
"valid_targets_mean": 3880.5,
"valid_targets_min": 1031
},
{
"epoch": 3.9130434782608696,
"grad_norm": 0.43145818157727733,
"learning_rate": 1.9380073154772707e-05,
"loss": 0.2929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2653549909591675,
"step": 5130,
"valid_targets_mean": 4223.7,
"valid_targets_min": 1216
},
{
"epoch": 3.9168573607932875,
"grad_norm": 0.4877286412806023,
"learning_rate": 1.934205416196156e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2932646572589874,
"step": 5135,
"valid_targets_mean": 3868.4,
"valid_targets_min": 898
},
{
"epoch": 3.920671243325706,
"grad_norm": 0.41908844260246153,
"learning_rate": 1.9304037549138783e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29270559549331665,
"step": 5140,
"valid_targets_mean": 4753.8,
"valid_targets_min": 786
},
{
"epoch": 3.9244851258581237,
"grad_norm": 0.4784502269230572,
"learning_rate": 1.926602345382192e-05,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3063240647315979,
"step": 5145,
"valid_targets_mean": 4156.7,
"valid_targets_min": 830
},
{
"epoch": 3.9282990083905416,
"grad_norm": 0.4343307443707409,
"learning_rate": 1.9228012013519414e-05,
"loss": 0.2806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2735506296157837,
"step": 5150,
"valid_targets_mean": 4672.8,
"valid_targets_min": 589
},
{
"epoch": 3.9321128909229595,
"grad_norm": 0.4300181559503131,
"learning_rate": 1.9190003365730096e-05,
"loss": 0.298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2812347710132599,
"step": 5155,
"valid_targets_mean": 5184.3,
"valid_targets_min": 257
},
{
"epoch": 3.9359267734553773,
"grad_norm": 0.4368057207707122,
"learning_rate": 1.9151997647942702e-05,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31642988324165344,
"step": 5160,
"valid_targets_mean": 5125.9,
"valid_targets_min": 1586
},
{
"epoch": 3.9397406559877957,
"grad_norm": 0.5006746338061084,
"learning_rate": 1.9113994997635362e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3068694472312927,
"step": 5165,
"valid_targets_mean": 3927.8,
"valid_targets_min": 1098
},
{
"epoch": 3.9435545385202135,
"grad_norm": 0.479151537271904,
"learning_rate": 1.9075995552275112e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3017423450946808,
"step": 5170,
"valid_targets_mean": 4141.9,
"valid_targets_min": 949
},
{
"epoch": 3.9473684210526314,
"grad_norm": 0.46514469000401915,
"learning_rate": 1.9037999449317406e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28211966156959534,
"step": 5175,
"valid_targets_mean": 4282.8,
"valid_targets_min": 787
},
{
"epoch": 3.9511823035850497,
"grad_norm": 0.4460611254139414,
"learning_rate": 1.9000006826205594e-05,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28090232610702515,
"step": 5180,
"valid_targets_mean": 4177.1,
"valid_targets_min": 1063
},
{
"epoch": 3.9549961861174676,
"grad_norm": 0.4391877582917011,
"learning_rate": 1.8962017820370443e-05,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.282697468996048,
"step": 5185,
"valid_targets_mean": 4237.3,
"valid_targets_min": 903
},
{
"epoch": 3.9588100686498855,
"grad_norm": 0.4187783195267498,
"learning_rate": 1.892403256922964e-05,
"loss": 0.2777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23168055713176727,
"step": 5190,
"valid_targets_mean": 4525.2,
"valid_targets_min": 528
},
{
"epoch": 3.9626239511823034,
"grad_norm": 0.4528277753081471,
"learning_rate": 1.8886051210187277e-05,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2916136085987091,
"step": 5195,
"valid_targets_mean": 4180.0,
"valid_targets_min": 906
},
{
"epoch": 3.9664378337147217,
"grad_norm": 0.5162672915536458,
"learning_rate": 1.884807388063338e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28006768226623535,
"step": 5200,
"valid_targets_mean": 3554.5,
"valid_targets_min": 837
},
{
"epoch": 3.9702517162471396,
"grad_norm": 0.421583313476623,
"learning_rate": 1.8810100717943393e-05,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28844282031059265,
"step": 5205,
"valid_targets_mean": 4721.1,
"valid_targets_min": 957
},
{
"epoch": 3.9740655987795575,
"grad_norm": 0.419280792206997,
"learning_rate": 1.877213185947769e-05,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26939424872398376,
"step": 5210,
"valid_targets_mean": 4626.4,
"valid_targets_min": 1120
},
{
"epoch": 3.9778794813119758,
"grad_norm": 0.4629473209847183,
"learning_rate": 1.8734167442581072e-05,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24810916185379028,
"step": 5215,
"valid_targets_mean": 4065.1,
"valid_targets_min": 871
},
{
"epoch": 3.9816933638443937,
"grad_norm": 0.5118809234713598,
"learning_rate": 1.869620760458228e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3038460314273834,
"step": 5220,
"valid_targets_mean": 3327.3,
"valid_targets_min": 1278
},
{
"epoch": 3.9855072463768115,
"grad_norm": 0.5035213322974476,
"learning_rate": 1.8658252482793485e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.292995423078537,
"step": 5225,
"valid_targets_mean": 4340.3,
"valid_targets_min": 1044
},
{
"epoch": 3.9893211289092294,
"grad_norm": 0.42529772495906987,
"learning_rate": 1.8620302214509804e-05,
"loss": 0.2759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23590444028377533,
"step": 5230,
"valid_targets_mean": 3947.8,
"valid_targets_min": 258
},
{
"epoch": 3.9931350114416477,
"grad_norm": 0.4357103197502,
"learning_rate": 1.8582356937008785e-05,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24585048854351044,
"step": 5235,
"valid_targets_mean": 5009.6,
"valid_targets_min": 708
},
{
"epoch": 3.9969488939740656,
"grad_norm": 0.3816166815814907,
"learning_rate": 1.8544416787549942e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2795417308807373,
"step": 5240,
"valid_targets_mean": 5411.3,
"valid_targets_min": 751
},
{
"epoch": 4.000762776506484,
"grad_norm": 0.5416479526027371,
"learning_rate": 1.850648190337422e-05,
"loss": 0.487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27904537320137024,
"step": 5245,
"valid_targets_mean": 3583.6,
"valid_targets_min": 1165
},
{
"epoch": 4.004576659038902,
"grad_norm": 0.5087452060708784,
"learning_rate": 1.8468552421703535e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31443047523498535,
"step": 5250,
"valid_targets_mean": 3674.5,
"valid_targets_min": 1189
},
{
"epoch": 4.00839054157132,
"grad_norm": 0.47920887196013023,
"learning_rate": 1.8430628479740243e-05,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2631620168685913,
"step": 5255,
"valid_targets_mean": 4028.5,
"valid_targets_min": 732
},
{
"epoch": 4.012204424103738,
"grad_norm": 0.43552125958300064,
"learning_rate": 1.839271021466668e-05,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28635895252227783,
"step": 5260,
"valid_targets_mean": 5221.5,
"valid_targets_min": 1206
},
{
"epoch": 4.016018306636155,
"grad_norm": 0.46905637576964415,
"learning_rate": 1.8354797763644628e-05,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2725812494754791,
"step": 5265,
"valid_targets_mean": 4305.4,
"valid_targets_min": 1119
},
{
"epoch": 4.019832189168573,
"grad_norm": 0.43349093244065384,
"learning_rate": 1.831689126381486e-05,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30661433935165405,
"step": 5270,
"valid_targets_mean": 4936.6,
"valid_targets_min": 1143
},
{
"epoch": 4.023646071700991,
"grad_norm": 0.4918320057290233,
"learning_rate": 1.8278990852296598e-05,
"loss": 0.2795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25690630078315735,
"step": 5275,
"valid_targets_mean": 3922.7,
"valid_targets_min": 403
},
{
"epoch": 4.02745995423341,
"grad_norm": 0.42458062947621084,
"learning_rate": 1.824109666618706e-05,
"loss": 0.2913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30049416422843933,
"step": 5280,
"valid_targets_mean": 4960.4,
"valid_targets_min": 1542
},
{
"epoch": 4.031273836765828,
"grad_norm": 0.39963645779686524,
"learning_rate": 1.820320884256093e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23063836991786957,
"step": 5285,
"valid_targets_mean": 4685.0,
"valid_targets_min": 1292
},
{
"epoch": 4.035087719298246,
"grad_norm": 0.41970732682492695,
"learning_rate": 1.8165327518469888e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22459344565868378,
"step": 5290,
"valid_targets_mean": 4371.2,
"valid_targets_min": 794
},
{
"epoch": 4.038901601830664,
"grad_norm": 0.4908945778200589,
"learning_rate": 1.8127452830942097e-05,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542988359928131,
"step": 5295,
"valid_targets_mean": 4042.7,
"valid_targets_min": 398
},
{
"epoch": 4.0427154843630815,
"grad_norm": 0.435112076490909,
"learning_rate": 1.8089584916981714e-05,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22995798289775848,
"step": 5300,
"valid_targets_mean": 4469.0,
"valid_targets_min": 1104
},
{
"epoch": 4.046529366895499,
"grad_norm": 0.496497698029133,
"learning_rate": 1.8051723913568393e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2845947742462158,
"step": 5305,
"valid_targets_mean": 3867.3,
"valid_targets_min": 428
},
{
"epoch": 4.050343249427917,
"grad_norm": 0.4521890524780476,
"learning_rate": 1.80138699576568e-05,
"loss": 0.2689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2707526981830597,
"step": 5310,
"valid_targets_mean": 4219.8,
"valid_targets_min": 932
},
{
"epoch": 4.054157131960336,
"grad_norm": 0.44957196568861707,
"learning_rate": 1.7976023186176102e-05,
"loss": 0.2832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.266658216714859,
"step": 5315,
"valid_targets_mean": 4021.2,
"valid_targets_min": 671
},
{
"epoch": 4.057971014492754,
"grad_norm": 0.43451221759899866,
"learning_rate": 1.7938183736029473e-05,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2787042558193207,
"step": 5320,
"valid_targets_mean": 4478.9,
"valid_targets_min": 1003
},
{
"epoch": 4.061784897025172,
"grad_norm": 0.4092319501876168,
"learning_rate": 1.7900351744093604e-05,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2590319812297821,
"step": 5325,
"valid_targets_mean": 4576.3,
"valid_targets_min": 941
},
{
"epoch": 4.06559877955759,
"grad_norm": 0.44767830732575387,
"learning_rate": 1.7862527347218213e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27546316385269165,
"step": 5330,
"valid_targets_mean": 4749.5,
"valid_targets_min": 857
},
{
"epoch": 4.0694126620900075,
"grad_norm": 0.4185953444093869,
"learning_rate": 1.7824710682225546e-05,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29678523540496826,
"step": 5335,
"valid_targets_mean": 5015.9,
"valid_targets_min": 1048
},
{
"epoch": 4.073226544622425,
"grad_norm": 0.5216767400389845,
"learning_rate": 1.7786901885909872e-05,
"loss": 0.272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2771632969379425,
"step": 5340,
"valid_targets_mean": 3328.6,
"valid_targets_min": 531
},
{
"epoch": 4.077040427154843,
"grad_norm": 0.462063501870652,
"learning_rate": 1.7749101095037004e-05,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24681317806243896,
"step": 5345,
"valid_targets_mean": 4025.9,
"valid_targets_min": 690
},
{
"epoch": 4.080854309687262,
"grad_norm": 0.45346407117733667,
"learning_rate": 1.7711308446343787e-05,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28253352642059326,
"step": 5350,
"valid_targets_mean": 4707.8,
"valid_targets_min": 1112
},
{
"epoch": 4.08466819221968,
"grad_norm": 0.4785053811062835,
"learning_rate": 1.7673524076537628e-05,
"loss": 0.291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29810595512390137,
"step": 5355,
"valid_targets_mean": 4859.3,
"valid_targets_min": 1050
},
{
"epoch": 4.088482074752098,
"grad_norm": 0.4308493569201197,
"learning_rate": 1.7635748122295978e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24559128284454346,
"step": 5360,
"valid_targets_mean": 4339.5,
"valid_targets_min": 433
},
{
"epoch": 4.092295957284516,
"grad_norm": 0.48191302755325544,
"learning_rate": 1.7597980720265846e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28685423731803894,
"step": 5365,
"valid_targets_mean": 4426.0,
"valid_targets_min": 963
},
{
"epoch": 4.0961098398169336,
"grad_norm": 0.4875942242372229,
"learning_rate": 1.7560222007063308e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2825605869293213,
"step": 5370,
"valid_targets_mean": 4379.4,
"valid_targets_min": 1093
},
{
"epoch": 4.099923722349351,
"grad_norm": 0.5047475576226177,
"learning_rate": 1.7522472119273004e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2979480028152466,
"step": 5375,
"valid_targets_mean": 4211.3,
"valid_targets_min": 994
},
{
"epoch": 4.103737604881769,
"grad_norm": 0.47812820392617394,
"learning_rate": 1.7484731193447658e-05,
"loss": 0.2759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2687206268310547,
"step": 5380,
"valid_targets_mean": 3960.5,
"valid_targets_min": 594
},
{
"epoch": 4.107551487414188,
"grad_norm": 0.4620874475188822,
"learning_rate": 1.7446999366107574e-05,
"loss": 0.2939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30755627155303955,
"step": 5385,
"valid_targets_mean": 4346.6,
"valid_targets_min": 907
},
{
"epoch": 4.111365369946606,
"grad_norm": 0.5480698360224027,
"learning_rate": 1.7409276773740136e-05,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27984118461608887,
"step": 5390,
"valid_targets_mean": 2910.8,
"valid_targets_min": 1225
},
{
"epoch": 4.115179252479024,
"grad_norm": 0.433621353490338,
"learning_rate": 1.737156355279933e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2788759171962738,
"step": 5395,
"valid_targets_mean": 5113.2,
"valid_targets_min": 1293
},
{
"epoch": 4.118993135011442,
"grad_norm": 0.4639434128116733,
"learning_rate": 1.7333859839705246e-05,
"loss": 0.2703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2772332727909088,
"step": 5400,
"valid_targets_mean": 4186.8,
"valid_targets_min": 1279
},
{
"epoch": 4.12280701754386,
"grad_norm": 1.579151123306477,
"learning_rate": 1.7296165770843573e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5295971632003784,
"step": 5405,
"valid_targets_mean": 806.0,
"valid_targets_min": 581
},
{
"epoch": 4.1266209000762775,
"grad_norm": 0.5105839768882346,
"learning_rate": 1.7258481482565118e-05,
"loss": 0.3805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2567860186100006,
"step": 5410,
"valid_targets_mean": 3869.5,
"valid_targets_min": 1174
},
{
"epoch": 4.130434782608695,
"grad_norm": 0.44640858073953466,
"learning_rate": 1.722080711118531e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31472137570381165,
"step": 5415,
"valid_targets_mean": 4932.8,
"valid_targets_min": 696
},
{
"epoch": 4.134248665141113,
"grad_norm": 0.5039903115695159,
"learning_rate": 1.7183142792983697e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32861748337745667,
"step": 5420,
"valid_targets_mean": 4283.7,
"valid_targets_min": 336
},
{
"epoch": 4.138062547673532,
"grad_norm": 0.45734018055533465,
"learning_rate": 1.714548866420348e-05,
"loss": 0.2797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2520674169063568,
"step": 5425,
"valid_targets_mean": 4151.8,
"valid_targets_min": 1003
},
{
"epoch": 4.14187643020595,
"grad_norm": 0.5200103424217448,
"learning_rate": 1.710784486105098e-05,
"loss": 0.2872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3251253664493561,
"step": 5430,
"valid_targets_mean": 3897.5,
"valid_targets_min": 1039
},
{
"epoch": 4.145690312738368,
"grad_norm": 0.4458129550534968,
"learning_rate": 1.7070211519695176e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35341396927833557,
"step": 5435,
"valid_targets_mean": 5133.9,
"valid_targets_min": 967
},
{
"epoch": 4.149504195270786,
"grad_norm": 0.4420239232383797,
"learning_rate": 1.7032588776267208e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33999934792518616,
"step": 5440,
"valid_targets_mean": 4732.2,
"valid_targets_min": 1318
},
{
"epoch": 4.1533180778032035,
"grad_norm": 0.4741109970058931,
"learning_rate": 1.699497676685988e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29192444682121277,
"step": 5445,
"valid_targets_mean": 4110.2,
"valid_targets_min": 825
},
{
"epoch": 4.157131960335621,
"grad_norm": 0.4178824184918611,
"learning_rate": 1.695737562752716e-05,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2533215880393982,
"step": 5450,
"valid_targets_mean": 4636.5,
"valid_targets_min": 716
},
{
"epoch": 4.160945842868039,
"grad_norm": 0.4723531617223507,
"learning_rate": 1.6919785494283704e-05,
"loss": 0.2658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2707185745239258,
"step": 5455,
"valid_targets_mean": 3819.3,
"valid_targets_min": 706
},
{
"epoch": 4.164759725400458,
"grad_norm": 0.48034451668280265,
"learning_rate": 1.6882206503104345e-05,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29053595662117004,
"step": 5460,
"valid_targets_mean": 4347.7,
"valid_targets_min": 828
},
{
"epoch": 4.168573607932876,
"grad_norm": 0.5341006587681983,
"learning_rate": 1.6844638789923626e-05,
"loss": 0.2986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31795796751976013,
"step": 5465,
"valid_targets_mean": 3255.6,
"valid_targets_min": 873
},
{
"epoch": 4.172387490465294,
"grad_norm": 0.46299043551009134,
"learning_rate": 1.680708249063528e-05,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2508344352245331,
"step": 5470,
"valid_targets_mean": 4260.3,
"valid_targets_min": 831
},
{
"epoch": 4.176201372997712,
"grad_norm": 0.45616141827399853,
"learning_rate": 1.676953774109177e-05,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2717251777648926,
"step": 5475,
"valid_targets_mean": 4702.5,
"valid_targets_min": 1005
},
{
"epoch": 4.1800152555301295,
"grad_norm": 0.42401454170133096,
"learning_rate": 1.6732004677103758e-05,
"loss": 0.2904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29828864336013794,
"step": 5480,
"valid_targets_mean": 4791.1,
"valid_targets_min": 1118
},
{
"epoch": 4.183829138062547,
"grad_norm": 0.4527669070004305,
"learning_rate": 1.6694483434439656e-05,
"loss": 0.2689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25608429312705994,
"step": 5485,
"valid_targets_mean": 4262.0,
"valid_targets_min": 1530
},
{
"epoch": 4.187643020594965,
"grad_norm": 0.4816221826659873,
"learning_rate": 1.66569741488251e-05,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672211229801178,
"step": 5490,
"valid_targets_mean": 3935.8,
"valid_targets_min": 903
},
{
"epoch": 4.191456903127384,
"grad_norm": 0.4901532290032959,
"learning_rate": 1.6619476955942482e-05,
"loss": 0.2756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2634734511375427,
"step": 5495,
"valid_targets_mean": 3706.3,
"valid_targets_min": 530
},
{
"epoch": 4.195270785659802,
"grad_norm": 0.44500826527307435,
"learning_rate": 1.6581991991430445e-05,
"loss": 0.2816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2523365914821625,
"step": 5500,
"valid_targets_mean": 4076.1,
"valid_targets_min": 1141
},
{
"epoch": 4.19908466819222,
"grad_norm": 0.42766997819820646,
"learning_rate": 1.654451939088341e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672201097011566,
"step": 5505,
"valid_targets_mean": 5251.6,
"valid_targets_min": 1450
},
{
"epoch": 4.202898550724638,
"grad_norm": 0.5025906795175384,
"learning_rate": 1.6507059289851057e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3079371154308319,
"step": 5510,
"valid_targets_mean": 4642.8,
"valid_targets_min": 1081
},
{
"epoch": 4.206712433257056,
"grad_norm": 0.48921213724608315,
"learning_rate": 1.646961182383786e-05,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2763393819332123,
"step": 5515,
"valid_targets_mean": 3639.0,
"valid_targets_min": 1086
},
{
"epoch": 4.2105263157894735,
"grad_norm": 0.45072246512454434,
"learning_rate": 1.6432177128302597e-05,
"loss": 0.2775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3000883460044861,
"step": 5520,
"valid_targets_mean": 5069.9,
"valid_targets_min": 1688
},
{
"epoch": 4.214340198321891,
"grad_norm": 0.45130665609379705,
"learning_rate": 1.639475533865784e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28898870944976807,
"step": 5525,
"valid_targets_mean": 4288.3,
"valid_targets_min": 1208
},
{
"epoch": 4.21815408085431,
"grad_norm": 0.45781620819851476,
"learning_rate": 1.6357346590269477e-05,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28579166531562805,
"step": 5530,
"valid_targets_mean": 4843.5,
"valid_targets_min": 1194
},
{
"epoch": 4.221967963386728,
"grad_norm": 0.4758765538089831,
"learning_rate": 1.631995101845622e-05,
"loss": 0.2792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3063182532787323,
"step": 5535,
"valid_targets_mean": 4466.1,
"valid_targets_min": 880
},
{
"epoch": 4.225781845919146,
"grad_norm": 0.45531261671036943,
"learning_rate": 1.6282568758489132e-05,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3045072853565216,
"step": 5540,
"valid_targets_mean": 4690.0,
"valid_targets_min": 1236
},
{
"epoch": 4.229595728451564,
"grad_norm": 0.4263889830178174,
"learning_rate": 1.6245199945591105e-05,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29434555768966675,
"step": 5545,
"valid_targets_mean": 5107.2,
"valid_targets_min": 487
},
{
"epoch": 4.233409610983982,
"grad_norm": 0.49067696246605885,
"learning_rate": 1.6207844714936395e-05,
"loss": 0.2748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3065944015979767,
"step": 5550,
"valid_targets_mean": 4363.1,
"valid_targets_min": 458
},
{
"epoch": 4.2372234935163995,
"grad_norm": 0.40948653083424746,
"learning_rate": 1.6170503201650137e-05,
"loss": 0.2797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20808136463165283,
"step": 5555,
"valid_targets_mean": 4294.9,
"valid_targets_min": 966
},
{
"epoch": 4.241037376048817,
"grad_norm": 0.5026832111641061,
"learning_rate": 1.6133175540807824e-05,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2692430317401886,
"step": 5560,
"valid_targets_mean": 3893.9,
"valid_targets_min": 413
},
{
"epoch": 4.244851258581235,
"grad_norm": 0.4125233801311475,
"learning_rate": 1.6095861867434867e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32503649592399597,
"step": 5565,
"valid_targets_mean": 5176.9,
"valid_targets_min": 1670
},
{
"epoch": 4.248665141113654,
"grad_norm": 1.5198766849042715,
"learning_rate": 1.6058562316506067e-05,
"loss": 0.3617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5387596487998962,
"step": 5570,
"valid_targets_mean": 810.6,
"valid_targets_min": 535
},
{
"epoch": 4.252479023646072,
"grad_norm": 0.5345120185370117,
"learning_rate": 1.602127702294513e-05,
"loss": 0.4276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2753293514251709,
"step": 5575,
"valid_targets_mean": 4129.8,
"valid_targets_min": 1107
},
{
"epoch": 4.25629290617849,
"grad_norm": 0.42624283846744887,
"learning_rate": 1.598400612162421e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2693823575973511,
"step": 5580,
"valid_targets_mean": 4639.1,
"valid_targets_min": 1095
},
{
"epoch": 4.260106788710908,
"grad_norm": 0.4621944129281794,
"learning_rate": 1.5946749747363378e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3092004060745239,
"step": 5585,
"valid_targets_mean": 4519.8,
"valid_targets_min": 1406
},
{
"epoch": 4.2639206712433255,
"grad_norm": 0.427116201066583,
"learning_rate": 1.5909508034930174e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3015022873878479,
"step": 5590,
"valid_targets_mean": 4776.9,
"valid_targets_min": 612
},
{
"epoch": 4.267734553775743,
"grad_norm": 0.4772384606050245,
"learning_rate": 1.5872281119039092e-05,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26618143916130066,
"step": 5595,
"valid_targets_mean": 4011.5,
"valid_targets_min": 1010
},
{
"epoch": 4.271548436308162,
"grad_norm": 0.46352271693533037,
"learning_rate": 1.583506913435111e-05,
"loss": 0.2951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2845820486545563,
"step": 5600,
"valid_targets_mean": 4406.2,
"valid_targets_min": 637
},
{
"epoch": 4.27536231884058,
"grad_norm": 0.42304973311417576,
"learning_rate": 1.579787221547318e-05,
"loss": 0.2857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28748199343681335,
"step": 5605,
"valid_targets_mean": 4840.3,
"valid_targets_min": 419
},
{
"epoch": 4.279176201372998,
"grad_norm": 0.426975836904547,
"learning_rate": 1.5760690496957777e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26385220885276794,
"step": 5610,
"valid_targets_mean": 4914.1,
"valid_targets_min": 402
},
{
"epoch": 4.282990083905416,
"grad_norm": 0.48513234007763295,
"learning_rate": 1.5723524113302385e-05,
"loss": 0.2883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2918134033679962,
"step": 5615,
"valid_targets_mean": 4047.7,
"valid_targets_min": 980
},
{
"epoch": 4.286803966437834,
"grad_norm": 0.49163740430944686,
"learning_rate": 1.5686373198949e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23882454633712769,
"step": 5620,
"valid_targets_mean": 3536.7,
"valid_targets_min": 632
},
{
"epoch": 4.290617848970252,
"grad_norm": 0.46719163433098254,
"learning_rate": 1.564923788828369e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26404812932014465,
"step": 5625,
"valid_targets_mean": 4187.7,
"valid_targets_min": 1076
},
{
"epoch": 4.294431731502669,
"grad_norm": 0.45690373458159445,
"learning_rate": 1.5612118315636052e-05,
"loss": 0.2753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3266724646091461,
"step": 5630,
"valid_targets_mean": 4868.3,
"valid_targets_min": 1105
},
{
"epoch": 4.298245614035087,
"grad_norm": 0.41999328222502763,
"learning_rate": 1.557501461527877e-05,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27965047955513,
"step": 5635,
"valid_targets_mean": 5149.8,
"valid_targets_min": 1460
},
{
"epoch": 4.302059496567506,
"grad_norm": 0.46175536669142053,
"learning_rate": 1.5537926921427116e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27793920040130615,
"step": 5640,
"valid_targets_mean": 4480.2,
"valid_targets_min": 1324
},
{
"epoch": 4.305873379099924,
"grad_norm": 0.42147544339206316,
"learning_rate": 1.5500855368238442e-05,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257891982793808,
"step": 5645,
"valid_targets_mean": 5117.4,
"valid_targets_min": 1220
},
{
"epoch": 4.309687261632342,
"grad_norm": 0.44482482821139985,
"learning_rate": 1.5463800089811743e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24403272569179535,
"step": 5650,
"valid_targets_mean": 4186.8,
"valid_targets_min": 1146
},
{
"epoch": 4.31350114416476,
"grad_norm": 0.4599350132288009,
"learning_rate": 1.542676122018712e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24115292727947235,
"step": 5655,
"valid_targets_mean": 3831.2,
"valid_targets_min": 253
},
{
"epoch": 4.317315026697178,
"grad_norm": 0.49875170980568123,
"learning_rate": 1.5389738893345324e-05,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.234399676322937,
"step": 5660,
"valid_targets_mean": 3607.4,
"valid_targets_min": 1042
},
{
"epoch": 4.3211289092295955,
"grad_norm": 0.46862374247924743,
"learning_rate": 1.5352733243207272e-05,
"loss": 0.2659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2704668939113617,
"step": 5665,
"valid_targets_mean": 4192.1,
"valid_targets_min": 977
},
{
"epoch": 4.324942791762013,
"grad_norm": 0.4704412496016771,
"learning_rate": 1.531574440363355e-05,
"loss": 0.2787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31678804755210876,
"step": 5670,
"valid_targets_mean": 4463.8,
"valid_targets_min": 422
},
{
"epoch": 4.328756674294432,
"grad_norm": 0.46882886163215814,
"learning_rate": 1.527877250842394e-05,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2824307382106781,
"step": 5675,
"valid_targets_mean": 3865.7,
"valid_targets_min": 872
},
{
"epoch": 4.33257055682685,
"grad_norm": 0.465191078872391,
"learning_rate": 1.524181769131693e-05,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30152150988578796,
"step": 5680,
"valid_targets_mean": 4387.8,
"valid_targets_min": 1158
},
{
"epoch": 4.336384439359268,
"grad_norm": 0.4866591622076078,
"learning_rate": 1.5204880085989222e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2841610610485077,
"step": 5685,
"valid_targets_mean": 3781.8,
"valid_targets_min": 952
},
{
"epoch": 4.340198321891686,
"grad_norm": 0.45140279740309064,
"learning_rate": 1.5167959826055269e-05,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30225178599357605,
"step": 5690,
"valid_targets_mean": 4454.2,
"valid_targets_min": 1011
},
{
"epoch": 4.344012204424104,
"grad_norm": 0.4653747607523385,
"learning_rate": 1.5131057045066783e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2756575345993042,
"step": 5695,
"valid_targets_mean": 4502.6,
"valid_targets_min": 1432
},
{
"epoch": 4.3478260869565215,
"grad_norm": 0.45942886046871895,
"learning_rate": 1.5094171876512241e-05,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24686582386493683,
"step": 5700,
"valid_targets_mean": 3902.8,
"valid_targets_min": 1109
},
{
"epoch": 4.351639969488939,
"grad_norm": 0.5051926834497391,
"learning_rate": 1.505730445381641e-05,
"loss": 0.2852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2773900330066681,
"step": 5705,
"valid_targets_mean": 3772.5,
"valid_targets_min": 315
},
{
"epoch": 4.355453852021358,
"grad_norm": 0.4440379992293962,
"learning_rate": 1.5020454910339872e-05,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24155227839946747,
"step": 5710,
"valid_targets_mean": 4127.8,
"valid_targets_min": 1115
},
{
"epoch": 4.359267734553776,
"grad_norm": 0.44963486053345575,
"learning_rate": 1.4983623379378527e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28549474477767944,
"step": 5715,
"valid_targets_mean": 4378.5,
"valid_targets_min": 852
},
{
"epoch": 4.363081617086194,
"grad_norm": 0.4472315426767612,
"learning_rate": 1.4946809994163123e-05,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27043840289115906,
"step": 5720,
"valid_targets_mean": 4515.4,
"valid_targets_min": 1133
},
{
"epoch": 4.366895499618612,
"grad_norm": 0.49041276551147356,
"learning_rate": 1.4910014887858771e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672957479953766,
"step": 5725,
"valid_targets_mean": 4044.7,
"valid_targets_min": 957
},
{
"epoch": 4.37070938215103,
"grad_norm": 0.5021537373097715,
"learning_rate": 1.4873238193564453e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.256434828042984,
"step": 5730,
"valid_targets_mean": 3531.8,
"valid_targets_min": 1157
},
{
"epoch": 4.3745232646834475,
"grad_norm": 1.5771455277598134,
"learning_rate": 1.4836480044312554e-05,
"loss": 0.3403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5025232434272766,
"step": 5735,
"valid_targets_mean": 835.1,
"valid_targets_min": 688
},
{
"epoch": 4.378337147215865,
"grad_norm": 0.48611824526015895,
"learning_rate": 1.4799740573068387e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29094183444976807,
"step": 5740,
"valid_targets_mean": 4893.0,
"valid_targets_min": 1417
},
{
"epoch": 4.382151029748284,
"grad_norm": 0.4538885965811372,
"learning_rate": 1.4763019912729694e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26907357573509216,
"step": 5745,
"valid_targets_mean": 4450.6,
"valid_targets_min": 515
},
{
"epoch": 4.385964912280702,
"grad_norm": 0.4542783244954703,
"learning_rate": 1.472631819612615e-05,
"loss": 0.2828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27067530155181885,
"step": 5750,
"valid_targets_mean": 4019.0,
"valid_targets_min": 1012
},
{
"epoch": 4.38977879481312,
"grad_norm": 0.49891633273896363,
"learning_rate": 1.468963555601894e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28321823477745056,
"step": 5755,
"valid_targets_mean": 3763.9,
"valid_targets_min": 359
},
{
"epoch": 4.393592677345538,
"grad_norm": 0.4473374870727865,
"learning_rate": 1.4652972125100217e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2813161611557007,
"step": 5760,
"valid_targets_mean": 4015.6,
"valid_targets_min": 621
},
{
"epoch": 4.397406559877956,
"grad_norm": 0.467832789716142,
"learning_rate": 1.4616328035992667e-05,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26224663853645325,
"step": 5765,
"valid_targets_mean": 3888.2,
"valid_targets_min": 896
},
{
"epoch": 4.401220442410374,
"grad_norm": 0.43705587434793697,
"learning_rate": 1.4579703421249e-05,
"loss": 0.2834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30531108379364014,
"step": 5770,
"valid_targets_mean": 5288.5,
"valid_targets_min": 1568
},
{
"epoch": 4.4050343249427915,
"grad_norm": 0.4256869545786574,
"learning_rate": 1.4543098413351486e-05,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2970990240573883,
"step": 5775,
"valid_targets_mean": 5047.0,
"valid_targets_min": 881
},
{
"epoch": 4.408848207475209,
"grad_norm": 0.43583173290283295,
"learning_rate": 1.4506513144711472e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30243197083473206,
"step": 5780,
"valid_targets_mean": 5445.3,
"valid_targets_min": 1961
},
{
"epoch": 4.412662090007628,
"grad_norm": 0.45939499966153063,
"learning_rate": 1.4469947747668895e-05,
"loss": 0.2857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2970567047595978,
"step": 5785,
"valid_targets_mean": 4571.8,
"valid_targets_min": 1102
},
{
"epoch": 4.416475972540046,
"grad_norm": 0.39838106818527075,
"learning_rate": 1.4433402354491818e-05,
"loss": 0.262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2937869727611542,
"step": 5790,
"valid_targets_mean": 5518.0,
"valid_targets_min": 1383
},
{
"epoch": 4.420289855072464,
"grad_norm": 0.4420135944332066,
"learning_rate": 1.4396877097375942e-05,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33492088317871094,
"step": 5795,
"valid_targets_mean": 5061.8,
"valid_targets_min": 973
},
{
"epoch": 4.424103737604882,
"grad_norm": 0.49186119929950545,
"learning_rate": 1.4360372108444125e-05,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26581743359565735,
"step": 5800,
"valid_targets_mean": 3358.6,
"valid_targets_min": 357
},
{
"epoch": 4.4279176201373,
"grad_norm": 0.44575600794041736,
"learning_rate": 1.4323887519745916e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29282018542289734,
"step": 5805,
"valid_targets_mean": 4706.3,
"valid_targets_min": 1235
},
{
"epoch": 4.4317315026697175,
"grad_norm": 0.4183264646741452,
"learning_rate": 1.4287423463257063e-05,
"loss": 0.2844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26400482654571533,
"step": 5810,
"valid_targets_mean": 4878.5,
"valid_targets_min": 1455
},
{
"epoch": 4.435545385202135,
"grad_norm": 0.4731714728599063,
"learning_rate": 1.4250980070879055e-05,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2791379988193512,
"step": 5815,
"valid_targets_mean": 4437.2,
"valid_targets_min": 1131
},
{
"epoch": 4.439359267734554,
"grad_norm": 0.4733320793835799,
"learning_rate": 1.4214557474438619e-05,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28043392300605774,
"step": 5820,
"valid_targets_mean": 4277.6,
"valid_targets_min": 1061
},
{
"epoch": 4.443173150266972,
"grad_norm": 0.45787589149165286,
"learning_rate": 1.4178155805687264e-05,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3145343065261841,
"step": 5825,
"valid_targets_mean": 5004.2,
"valid_targets_min": 824
},
{
"epoch": 4.44698703279939,
"grad_norm": 0.426977376897121,
"learning_rate": 1.4141775196300796e-05,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2563020586967468,
"step": 5830,
"valid_targets_mean": 4465.5,
"valid_targets_min": 1218
},
{
"epoch": 4.450800915331808,
"grad_norm": 0.5159147361121579,
"learning_rate": 1.410541577787884e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24296748638153076,
"step": 5835,
"valid_targets_mean": 4424.7,
"valid_targets_min": 523
},
{
"epoch": 4.454614797864226,
"grad_norm": 0.4422629941501212,
"learning_rate": 1.406907768194437e-05,
"loss": 0.2689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2830718755722046,
"step": 5840,
"valid_targets_mean": 4799.2,
"valid_targets_min": 472
},
{
"epoch": 4.4584286803966435,
"grad_norm": 0.4616483695107263,
"learning_rate": 1.4032761039943232e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.323681503534317,
"step": 5845,
"valid_targets_mean": 4502.0,
"valid_targets_min": 1044
},
{
"epoch": 4.462242562929061,
"grad_norm": 0.44725678549137443,
"learning_rate": 1.3996465983243663e-05,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2807271480560303,
"step": 5850,
"valid_targets_mean": 4554.4,
"valid_targets_min": 836
},
{
"epoch": 4.46605644546148,
"grad_norm": 0.4593516328145645,
"learning_rate": 1.3960192643135817e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3010134696960449,
"step": 5855,
"valid_targets_mean": 4276.0,
"valid_targets_min": 537
},
{
"epoch": 4.469870327993898,
"grad_norm": 0.48968025049502933,
"learning_rate": 1.3923941150831304e-05,
"loss": 0.2885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2574882507324219,
"step": 5860,
"valid_targets_mean": 4256.4,
"valid_targets_min": 1127
},
{
"epoch": 4.473684210526316,
"grad_norm": 0.45205623140214196,
"learning_rate": 1.3887711637462692e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29931384325027466,
"step": 5865,
"valid_targets_mean": 4524.5,
"valid_targets_min": 1240
},
{
"epoch": 4.477498093058734,
"grad_norm": 0.4363509333460341,
"learning_rate": 1.385150423408305e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23655830323696136,
"step": 5870,
"valid_targets_mean": 4474.1,
"valid_targets_min": 414
},
{
"epoch": 4.481311975591152,
"grad_norm": 0.4299324110154981,
"learning_rate": 1.3815319071665465e-05,
"loss": 0.2973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2632123529911041,
"step": 5875,
"valid_targets_mean": 4886.5,
"valid_targets_min": 531
},
{
"epoch": 4.48512585812357,
"grad_norm": 0.5194009105360434,
"learning_rate": 1.3779156281102574e-05,
"loss": 0.264,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27804139256477356,
"step": 5880,
"valid_targets_mean": 3514.6,
"valid_targets_min": 417
},
{
"epoch": 4.488939740655987,
"grad_norm": 0.6032698548453926,
"learning_rate": 1.3743015993206092e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2937086522579193,
"step": 5885,
"valid_targets_mean": 3735.5,
"valid_targets_min": 728
},
{
"epoch": 4.492753623188406,
"grad_norm": 0.43407844015473207,
"learning_rate": 1.3706898338706328e-05,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27821847796440125,
"step": 5890,
"valid_targets_mean": 4741.5,
"valid_targets_min": 1018
},
{
"epoch": 4.496567505720824,
"grad_norm": 1.5044846660486753,
"learning_rate": 1.3670803448251724e-05,
"loss": 0.3162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5219283103942871,
"step": 5895,
"valid_targets_mean": 787.7,
"valid_targets_min": 432
},
{
"epoch": 4.500381388253242,
"grad_norm": 0.4767872042750548,
"learning_rate": 1.3634731452408373e-05,
"loss": 0.4027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30305016040802,
"step": 5900,
"valid_targets_mean": 4886.7,
"valid_targets_min": 1604
},
{
"epoch": 4.50419527078566,
"grad_norm": 0.45889438457,
"learning_rate": 1.3598682481659556e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2751183807849884,
"step": 5905,
"valid_targets_mean": 4272.3,
"valid_targets_min": 1270
},
{
"epoch": 4.508009153318078,
"grad_norm": 0.5049581257103946,
"learning_rate": 1.3562656666405268e-05,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2787635028362274,
"step": 5910,
"valid_targets_mean": 4410.7,
"valid_targets_min": 1023
},
{
"epoch": 4.511823035850496,
"grad_norm": 0.47197243732827343,
"learning_rate": 1.3526654136961734e-05,
"loss": 0.2782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2548222839832306,
"step": 5915,
"valid_targets_mean": 3748.5,
"valid_targets_min": 1234
},
{
"epoch": 4.5156369183829135,
"grad_norm": 0.531002042605842,
"learning_rate": 1.3490675023560958e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27940547466278076,
"step": 5920,
"valid_targets_mean": 3234.5,
"valid_targets_min": 842
},
{
"epoch": 4.519450800915331,
"grad_norm": 0.42608539048001653,
"learning_rate": 1.3454719456350227e-05,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2519294321537018,
"step": 5925,
"valid_targets_mean": 4580.6,
"valid_targets_min": 850
},
{
"epoch": 4.52326468344775,
"grad_norm": 0.4337057125152285,
"learning_rate": 1.341878756539167e-05,
"loss": 0.2886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535187005996704,
"step": 5930,
"valid_targets_mean": 4240.9,
"valid_targets_min": 896
},
{
"epoch": 4.527078565980168,
"grad_norm": 0.44211798863673996,
"learning_rate": 1.3382879480661764e-05,
"loss": 0.2782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28309544920921326,
"step": 5935,
"valid_targets_mean": 4592.7,
"valid_targets_min": 1101
},
{
"epoch": 4.530892448512586,
"grad_norm": 0.4310747429914301,
"learning_rate": 1.334699533205087e-05,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27521029114723206,
"step": 5940,
"valid_targets_mean": 4518.3,
"valid_targets_min": 1287
},
{
"epoch": 4.534706331045004,
"grad_norm": 0.4439661875246889,
"learning_rate": 1.3311135249362765e-05,
"loss": 0.2659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2662383019924164,
"step": 5945,
"valid_targets_mean": 4220.8,
"valid_targets_min": 1279
},
{
"epoch": 4.538520213577422,
"grad_norm": 0.4158911308719578,
"learning_rate": 1.3275299362314183e-05,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26738566160202026,
"step": 5950,
"valid_targets_mean": 5363.2,
"valid_targets_min": 1796
},
{
"epoch": 4.5423340961098395,
"grad_norm": 0.5328998160967272,
"learning_rate": 1.323948780053432e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2578364610671997,
"step": 5955,
"valid_targets_mean": 3145.2,
"valid_targets_min": 948
},
{
"epoch": 4.546147978642258,
"grad_norm": 0.4627383344985359,
"learning_rate": 1.320370069356439e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3163941204547882,
"step": 5960,
"valid_targets_mean": 4478.6,
"valid_targets_min": 1010
},
{
"epoch": 4.549961861174676,
"grad_norm": 0.46521595739091043,
"learning_rate": 1.3167938170857144e-05,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29799818992614746,
"step": 5965,
"valid_targets_mean": 4643.4,
"valid_targets_min": 1383
},
{
"epoch": 4.553775743707094,
"grad_norm": 0.46932508666922923,
"learning_rate": 1.3132200361776399e-05,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25845086574554443,
"step": 5970,
"valid_targets_mean": 4063.8,
"valid_targets_min": 472
},
{
"epoch": 4.557589626239512,
"grad_norm": 0.49516638729280765,
"learning_rate": 1.3096487395596587e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26746347546577454,
"step": 5975,
"valid_targets_mean": 3572.2,
"valid_targets_min": 432
},
{
"epoch": 4.56140350877193,
"grad_norm": 0.48711071485037627,
"learning_rate": 1.3060799401502263e-05,
"loss": 0.288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3077528774738312,
"step": 5980,
"valid_targets_mean": 4599.1,
"valid_targets_min": 1437
},
{
"epoch": 4.565217391304348,
"grad_norm": 0.483945859673428,
"learning_rate": 1.3025136508587659e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2518140375614166,
"step": 5985,
"valid_targets_mean": 3965.2,
"valid_targets_min": 1004
},
{
"epoch": 4.5690312738367655,
"grad_norm": 0.4719885943283488,
"learning_rate": 1.2989498845856201e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2801418602466583,
"step": 5990,
"valid_targets_mean": 3937.7,
"valid_targets_min": 1187
},
{
"epoch": 4.572845156369183,
"grad_norm": 0.42038699637659116,
"learning_rate": 1.2953886542220064e-05,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2455323487520218,
"step": 5995,
"valid_targets_mean": 4707.3,
"valid_targets_min": 1049
},
{
"epoch": 4.576659038901602,
"grad_norm": 0.3969957514118753,
"learning_rate": 1.2918299726499676e-05,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27261656522750854,
"step": 6000,
"valid_targets_mean": 6213.8,
"valid_targets_min": 1807
},
{
"epoch": 4.58047292143402,
"grad_norm": 0.4541016921407842,
"learning_rate": 1.2882738527423278e-05,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23699618875980377,
"step": 6005,
"valid_targets_mean": 3908.7,
"valid_targets_min": 1072
},
{
"epoch": 4.584286803966438,
"grad_norm": 0.43712584522591535,
"learning_rate": 1.2847203073626436e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29207512736320496,
"step": 6010,
"valid_targets_mean": 4578.5,
"valid_targets_min": 1249
},
{
"epoch": 4.588100686498856,
"grad_norm": 0.4478920451756276,
"learning_rate": 1.2811693493651602e-05,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22837209701538086,
"step": 6015,
"valid_targets_mean": 4246.5,
"valid_targets_min": 769
},
{
"epoch": 4.591914569031274,
"grad_norm": 0.4304258549375004,
"learning_rate": 1.2776209915947627e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2726576030254364,
"step": 6020,
"valid_targets_mean": 4741.2,
"valid_targets_min": 1066
},
{
"epoch": 4.595728451563692,
"grad_norm": 0.4243229034746278,
"learning_rate": 1.27407524688693e-05,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22514188289642334,
"step": 6025,
"valid_targets_mean": 4388.4,
"valid_targets_min": 1254
},
{
"epoch": 4.5995423340961095,
"grad_norm": 0.4741565772839733,
"learning_rate": 1.2705321280676897e-05,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31086888909339905,
"step": 6030,
"valid_targets_mean": 4512.9,
"valid_targets_min": 1289
},
{
"epoch": 4.603356216628528,
"grad_norm": 0.427168564883841,
"learning_rate": 1.2669916479535695e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28429481387138367,
"step": 6035,
"valid_targets_mean": 5438.9,
"valid_targets_min": 1283
},
{
"epoch": 4.607170099160946,
"grad_norm": 0.5386715627774374,
"learning_rate": 1.2634538193515544e-05,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24557559192180634,
"step": 6040,
"valid_targets_mean": 3304.1,
"valid_targets_min": 852
},
{
"epoch": 4.610983981693364,
"grad_norm": 0.46561727285996857,
"learning_rate": 1.2599186550590355e-05,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2816053628921509,
"step": 6045,
"valid_targets_mean": 4762.0,
"valid_targets_min": 1659
},
{
"epoch": 4.614797864225782,
"grad_norm": 0.4334778280310194,
"learning_rate": 1.2563861678637675e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26823705434799194,
"step": 6050,
"valid_targets_mean": 5187.0,
"valid_targets_min": 1099
},
{
"epoch": 4.6186117467582,
"grad_norm": 0.4621016055707872,
"learning_rate": 1.2528563705438215e-05,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28503915667533875,
"step": 6055,
"valid_targets_mean": 5040.2,
"valid_targets_min": 1316
},
{
"epoch": 4.622425629290618,
"grad_norm": 0.5982601990337268,
"learning_rate": 1.2493292758675379e-05,
"loss": 0.2891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2772160470485687,
"step": 6060,
"valid_targets_mean": 2937.5,
"valid_targets_min": 653
},
{
"epoch": 4.6262395118230355,
"grad_norm": 0.640637801864729,
"learning_rate": 1.245804896593481e-05,
"loss": 0.4612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3399999141693115,
"step": 6065,
"valid_targets_mean": 3138.5,
"valid_targets_min": 796
},
{
"epoch": 4.630053394355453,
"grad_norm": 0.480477869036594,
"learning_rate": 1.2422832454703925e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2532704770565033,
"step": 6070,
"valid_targets_mean": 3822.2,
"valid_targets_min": 464
},
{
"epoch": 4.633867276887872,
"grad_norm": 0.5193519065919779,
"learning_rate": 1.2387643352371458e-05,
"loss": 0.2761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27806735038757324,
"step": 6075,
"valid_targets_mean": 3533.6,
"valid_targets_min": 1167
},
{
"epoch": 4.63768115942029,
"grad_norm": 0.45415550206324007,
"learning_rate": 1.2352481786227002e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2920186221599579,
"step": 6080,
"valid_targets_mean": 5147.2,
"valid_targets_min": 1086
},
{
"epoch": 4.641495041952708,
"grad_norm": 0.4516307494153642,
"learning_rate": 1.2317347883460533e-05,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2339109182357788,
"step": 6085,
"valid_targets_mean": 4068.7,
"valid_targets_min": 1158
},
{
"epoch": 4.645308924485126,
"grad_norm": 0.533201480795766,
"learning_rate": 1.228224177116197e-05,
"loss": 0.2706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30167070031166077,
"step": 6090,
"valid_targets_mean": 4061.7,
"valid_targets_min": 580
},
{
"epoch": 4.649122807017544,
"grad_norm": 0.44208307954025483,
"learning_rate": 1.2247163576320691e-05,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26982858777046204,
"step": 6095,
"valid_targets_mean": 4680.1,
"valid_targets_min": 1126
},
{
"epoch": 4.6529366895499615,
"grad_norm": 0.4684962063196071,
"learning_rate": 1.2212113425825108e-05,
"loss": 0.288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2656426727771759,
"step": 6100,
"valid_targets_mean": 4013.8,
"valid_targets_min": 1228
},
{
"epoch": 4.65675057208238,
"grad_norm": 0.4704971087227113,
"learning_rate": 1.2177091446462165e-05,
"loss": 0.2745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2484935075044632,
"step": 6105,
"valid_targets_mean": 4056.9,
"valid_targets_min": 1235
},
{
"epoch": 4.660564454614798,
"grad_norm": 0.4793308933230215,
"learning_rate": 1.2142097764916932e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27687665820121765,
"step": 6110,
"valid_targets_mean": 4041.4,
"valid_targets_min": 1256
},
{
"epoch": 4.664378337147216,
"grad_norm": 0.430844114668902,
"learning_rate": 1.210713250777209e-05,
"loss": 0.2595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2678356170654297,
"step": 6115,
"valid_targets_mean": 5247.5,
"valid_targets_min": 1208
},
{
"epoch": 4.668192219679634,
"grad_norm": 0.4610368968711122,
"learning_rate": 1.2072195801507514e-05,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27113208174705505,
"step": 6120,
"valid_targets_mean": 3816.7,
"valid_targets_min": 979
},
{
"epoch": 4.672006102212052,
"grad_norm": 0.4783363189865354,
"learning_rate": 1.20372877724998e-05,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22927595674991608,
"step": 6125,
"valid_targets_mean": 3613.3,
"valid_targets_min": 880
},
{
"epoch": 4.67581998474447,
"grad_norm": 0.4437246147947317,
"learning_rate": 1.2002408547021806e-05,
"loss": 0.2743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23522575199604034,
"step": 6130,
"valid_targets_mean": 5034.9,
"valid_targets_min": 985
},
{
"epoch": 4.679633867276888,
"grad_norm": 0.4123331439857932,
"learning_rate": 1.1967558251242202e-05,
"loss": 0.2422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2195393294095993,
"step": 6135,
"valid_targets_mean": 4580.7,
"valid_targets_min": 1199
},
{
"epoch": 4.6834477498093054,
"grad_norm": 0.48821062186968395,
"learning_rate": 1.193273701122501e-05,
"loss": 0.2808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29080095887184143,
"step": 6140,
"valid_targets_mean": 3972.9,
"valid_targets_min": 617
},
{
"epoch": 4.687261632341724,
"grad_norm": 0.46089074530910856,
"learning_rate": 1.1897944952929147e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29182562232017517,
"step": 6145,
"valid_targets_mean": 4697.0,
"valid_targets_min": 829
},
{
"epoch": 4.691075514874142,
"grad_norm": 0.5337402462436025,
"learning_rate": 1.1863182202207977e-05,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26698315143585205,
"step": 6150,
"valid_targets_mean": 3188.3,
"valid_targets_min": 453
},
{
"epoch": 4.69488939740656,
"grad_norm": 0.39887817966067385,
"learning_rate": 1.1828448884808843e-05,
"loss": 0.2541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23282591998577118,
"step": 6155,
"valid_targets_mean": 5004.8,
"valid_targets_min": 1170
},
{
"epoch": 4.698703279938978,
"grad_norm": 0.44218313890919614,
"learning_rate": 1.1793745126372621e-05,
"loss": 0.2784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2869015634059906,
"step": 6160,
"valid_targets_mean": 4819.4,
"valid_targets_min": 1478
},
{
"epoch": 4.702517162471396,
"grad_norm": 0.4671992817834822,
"learning_rate": 1.1759071052433267e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.259736031293869,
"step": 6165,
"valid_targets_mean": 4065.2,
"valid_targets_min": 436
},
{
"epoch": 4.706331045003814,
"grad_norm": 0.4158893122333823,
"learning_rate": 1.1724426788417348e-05,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3164721131324768,
"step": 6170,
"valid_targets_mean": 5909.0,
"valid_targets_min": 789
},
{
"epoch": 4.710144927536232,
"grad_norm": 0.44964144254203897,
"learning_rate": 1.1689812459643612e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2597438395023346,
"step": 6175,
"valid_targets_mean": 4044.4,
"valid_targets_min": 934
},
{
"epoch": 4.71395881006865,
"grad_norm": 0.4621900769426731,
"learning_rate": 1.1655228191322511e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24745304882526398,
"step": 6180,
"valid_targets_mean": 4173.3,
"valid_targets_min": 1173
},
{
"epoch": 4.717772692601068,
"grad_norm": 0.5019089891367999,
"learning_rate": 1.1620674108555786e-05,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2863067090511322,
"step": 6185,
"valid_targets_mean": 4092.0,
"valid_targets_min": 1843
},
{
"epoch": 4.721586575133486,
"grad_norm": 0.5402156848005659,
"learning_rate": 1.1586150336335937e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19477152824401855,
"step": 6190,
"valid_targets_mean": 4124.9,
"valid_targets_min": 993
},
{
"epoch": 4.725400457665904,
"grad_norm": 0.45180783666601976,
"learning_rate": 1.1551656999545879e-05,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2611711919307709,
"step": 6195,
"valid_targets_mean": 4767.4,
"valid_targets_min": 1080
},
{
"epoch": 4.729214340198322,
"grad_norm": 0.43472107197938675,
"learning_rate": 1.1517194222958385e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2774430811405182,
"step": 6200,
"valid_targets_mean": 4779.7,
"valid_targets_min": 1768
},
{
"epoch": 4.73302822273074,
"grad_norm": 0.4131997148781024,
"learning_rate": 1.1482762131235723e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2677346169948578,
"step": 6205,
"valid_targets_mean": 5425.2,
"valid_targets_min": 1425
},
{
"epoch": 4.7368421052631575,
"grad_norm": 0.4767133309486682,
"learning_rate": 1.1448360848929125e-05,
"loss": 0.2708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2785078287124634,
"step": 6210,
"valid_targets_mean": 3975.9,
"valid_targets_min": 680
},
{
"epoch": 4.740655987795575,
"grad_norm": 0.47301915164428615,
"learning_rate": 1.1413990500478404e-05,
"loss": 0.2756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25078871846199036,
"step": 6215,
"valid_targets_mean": 4398.8,
"valid_targets_min": 1321
},
{
"epoch": 4.744469870327994,
"grad_norm": 0.48680450680333354,
"learning_rate": 1.1379651210211482e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23261241614818573,
"step": 6220,
"valid_targets_mean": 3989.0,
"valid_targets_min": 863
},
{
"epoch": 4.748283752860412,
"grad_norm": 0.42575127016998615,
"learning_rate": 1.1345343102343898e-05,
"loss": 0.2751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24395425617694855,
"step": 6225,
"valid_targets_mean": 4580.4,
"valid_targets_min": 1255
},
{
"epoch": 4.75209763539283,
"grad_norm": 0.5622398324565753,
"learning_rate": 1.1311066300978438e-05,
"loss": 0.4105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28262239694595337,
"step": 6230,
"valid_targets_mean": 2832.5,
"valid_targets_min": 620
},
{
"epoch": 4.755911517925248,
"grad_norm": 0.48839896275848155,
"learning_rate": 1.1276820930104599e-05,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2837162911891937,
"step": 6235,
"valid_targets_mean": 4031.0,
"valid_targets_min": 1314
},
{
"epoch": 4.759725400457666,
"grad_norm": 0.4469933360053575,
"learning_rate": 1.1242607113598227e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2282828837633133,
"step": 6240,
"valid_targets_mean": 4210.8,
"valid_targets_min": 617
},
{
"epoch": 4.763539282990084,
"grad_norm": 0.4459250961437655,
"learning_rate": 1.1208424975220992e-05,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26507505774497986,
"step": 6245,
"valid_targets_mean": 4829.0,
"valid_targets_min": 867
},
{
"epoch": 4.767353165522502,
"grad_norm": 0.44761512621995236,
"learning_rate": 1.1174274638620006e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2591985762119293,
"step": 6250,
"valid_targets_mean": 5047.7,
"valid_targets_min": 1386
},
{
"epoch": 4.77116704805492,
"grad_norm": 0.46003734262291296,
"learning_rate": 1.1140156227327312e-05,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24344348907470703,
"step": 6255,
"valid_targets_mean": 3709.6,
"valid_targets_min": 322
},
{
"epoch": 4.774980930587338,
"grad_norm": 0.4597165894813579,
"learning_rate": 1.110606986475949e-05,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2670276463031769,
"step": 6260,
"valid_targets_mean": 4286.9,
"valid_targets_min": 995
},
{
"epoch": 4.778794813119756,
"grad_norm": 0.45709678873048865,
"learning_rate": 1.1072015674217195e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22857964038848877,
"step": 6265,
"valid_targets_mean": 4505.5,
"valid_targets_min": 1520
},
{
"epoch": 4.782608695652174,
"grad_norm": 0.47553977436663747,
"learning_rate": 1.1037993778884682e-05,
"loss": 0.2716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27654123306274414,
"step": 6270,
"valid_targets_mean": 4468.1,
"valid_targets_min": 1259
},
{
"epoch": 4.786422578184592,
"grad_norm": 0.4349786674742026,
"learning_rate": 1.1004004301829414e-05,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25767046213150024,
"step": 6275,
"valid_targets_mean": 4472.5,
"valid_targets_min": 429
},
{
"epoch": 4.79023646071701,
"grad_norm": 0.4028363610927219,
"learning_rate": 1.0970047366001554e-05,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23868699371814728,
"step": 6280,
"valid_targets_mean": 4960.5,
"valid_targets_min": 855
},
{
"epoch": 4.7940503432494275,
"grad_norm": 0.48133951454517454,
"learning_rate": 1.0936123094233593e-05,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29551172256469727,
"step": 6285,
"valid_targets_mean": 4206.8,
"valid_targets_min": 696
},
{
"epoch": 4.797864225781846,
"grad_norm": 0.5032080776134414,
"learning_rate": 1.0902231609239827e-05,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2717246115207672,
"step": 6290,
"valid_targets_mean": 3735.2,
"valid_targets_min": 1154
},
{
"epoch": 4.801678108314264,
"grad_norm": 0.47775196462942643,
"learning_rate": 1.0868373033615982e-05,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23652702569961548,
"step": 6295,
"valid_targets_mean": 4304.8,
"valid_targets_min": 1440
},
{
"epoch": 4.805491990846682,
"grad_norm": 0.4450270865034603,
"learning_rate": 1.0834547489838721e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2865585386753082,
"step": 6300,
"valid_targets_mean": 5426.2,
"valid_targets_min": 1185
},
{
"epoch": 4.8093058733791,
"grad_norm": 0.591606504521793,
"learning_rate": 1.0800755100265232e-05,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2531816363334656,
"step": 6305,
"valid_targets_mean": 3974.3,
"valid_targets_min": 971
},
{
"epoch": 4.813119755911518,
"grad_norm": 0.46299858012511447,
"learning_rate": 1.076699598713278e-05,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25391659140586853,
"step": 6310,
"valid_targets_mean": 4571.8,
"valid_targets_min": 993
},
{
"epoch": 4.816933638443936,
"grad_norm": 0.43866444790079595,
"learning_rate": 1.0733270272558239e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2802743911743164,
"step": 6315,
"valid_targets_mean": 4542.2,
"valid_targets_min": 244
},
{
"epoch": 4.820747520976354,
"grad_norm": 0.4551570589007343,
"learning_rate": 1.0699578078537694e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2353227138519287,
"step": 6320,
"valid_targets_mean": 4614.6,
"valid_targets_min": 2119
},
{
"epoch": 4.824561403508772,
"grad_norm": 0.4701677190514475,
"learning_rate": 1.0665919526945947e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2597653567790985,
"step": 6325,
"valid_targets_mean": 4287.8,
"valid_targets_min": 1232
},
{
"epoch": 4.82837528604119,
"grad_norm": 0.45065967973941917,
"learning_rate": 1.0632294739536142e-05,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26184967160224915,
"step": 6330,
"valid_targets_mean": 4189.0,
"valid_targets_min": 317
},
{
"epoch": 4.832189168573608,
"grad_norm": 0.4491956885125322,
"learning_rate": 1.0598703837939248e-05,
"loss": 0.2842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26985234022140503,
"step": 6335,
"valid_targets_mean": 4688.4,
"valid_targets_min": 1051
},
{
"epoch": 4.836003051106026,
"grad_norm": 0.47402852666197354,
"learning_rate": 1.05651469436637e-05,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23498666286468506,
"step": 6340,
"valid_targets_mean": 5051.1,
"valid_targets_min": 1277
},
{
"epoch": 4.839816933638444,
"grad_norm": 0.5845640550501232,
"learning_rate": 1.0531624178094879e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2578241229057312,
"step": 6345,
"valid_targets_mean": 2851.9,
"valid_targets_min": 488
},
{
"epoch": 4.843630816170862,
"grad_norm": 0.4405871777300844,
"learning_rate": 1.0498135662494735e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27082574367523193,
"step": 6350,
"valid_targets_mean": 5172.5,
"valid_targets_min": 728
},
{
"epoch": 4.8474446987032795,
"grad_norm": 0.4078096120879491,
"learning_rate": 1.046468151800133e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26433292031288147,
"step": 6355,
"valid_targets_mean": 5071.0,
"valid_targets_min": 518
},
{
"epoch": 4.851258581235698,
"grad_norm": 0.45556925639901935,
"learning_rate": 1.0431261865628373e-05,
"loss": 0.2816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3047320544719696,
"step": 6360,
"valid_targets_mean": 4966.4,
"valid_targets_min": 565
},
{
"epoch": 4.855072463768116,
"grad_norm": 0.45539843805802527,
"learning_rate": 1.0397876826264835e-05,
"loss": 0.2757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29343321919441223,
"step": 6365,
"valid_targets_mean": 5031.4,
"valid_targets_min": 389
},
{
"epoch": 4.858886346300534,
"grad_norm": 0.5174457675449293,
"learning_rate": 1.036452652067444e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2625400722026825,
"step": 6370,
"valid_targets_mean": 3652.8,
"valid_targets_min": 1119
},
{
"epoch": 4.862700228832952,
"grad_norm": 0.42023442456712606,
"learning_rate": 1.033121106949532e-05,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27681344747543335,
"step": 6375,
"valid_targets_mean": 5527.3,
"valid_targets_min": 1281
},
{
"epoch": 4.86651411136537,
"grad_norm": 0.4745097765595684,
"learning_rate": 1.0297930593239483e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25876760482788086,
"step": 6380,
"valid_targets_mean": 3772.8,
"valid_targets_min": 609
},
{
"epoch": 4.870327993897788,
"grad_norm": 0.4452410560238349,
"learning_rate": 1.0264685212292443e-05,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33578386902809143,
"step": 6385,
"valid_targets_mean": 4824.7,
"valid_targets_min": 966
},
{
"epoch": 4.874141876430206,
"grad_norm": 0.44239743286286903,
"learning_rate": 1.0231475046912771e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29823407530784607,
"step": 6390,
"valid_targets_mean": 5004.5,
"valid_targets_min": 1091
},
{
"epoch": 4.877955758962624,
"grad_norm": 0.5195950786044768,
"learning_rate": 1.0198300217231627e-05,
"loss": 0.4296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30986395478248596,
"step": 6395,
"valid_targets_mean": 4166.0,
"valid_targets_min": 580
},
{
"epoch": 4.881769641495042,
"grad_norm": 0.48620033251297656,
"learning_rate": 1.0165160843252388e-05,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24216914176940918,
"step": 6400,
"valid_targets_mean": 3795.1,
"valid_targets_min": 1023
},
{
"epoch": 4.88558352402746,
"grad_norm": 0.4409043094002218,
"learning_rate": 1.0132057044850137e-05,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25296226143836975,
"step": 6405,
"valid_targets_mean": 4557.1,
"valid_targets_min": 1657
},
{
"epoch": 4.889397406559878,
"grad_norm": 0.4893275906184621,
"learning_rate": 1.0098988941771305e-05,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2721904218196869,
"step": 6410,
"valid_targets_mean": 4337.0,
"valid_targets_min": 269
},
{
"epoch": 4.893211289092296,
"grad_norm": 0.473091196768073,
"learning_rate": 1.0065956653633173e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2775305509567261,
"step": 6415,
"valid_targets_mean": 4149.3,
"valid_targets_min": 1155
},
{
"epoch": 4.897025171624714,
"grad_norm": 0.4611208289628004,
"learning_rate": 1.0032960299923485e-05,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2669666111469269,
"step": 6420,
"valid_targets_mean": 4127.0,
"valid_targets_min": 1402
},
{
"epoch": 4.900839054157132,
"grad_norm": 0.4446130762839984,
"learning_rate": 1.0000000000000006e-05,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2863334119319916,
"step": 6425,
"valid_targets_mean": 5016.7,
"valid_targets_min": 1316
},
{
"epoch": 4.9046529366895495,
"grad_norm": 0.4631447759575701,
"learning_rate": 9.967075873090057e-06,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2800535559654236,
"step": 6430,
"valid_targets_mean": 4280.8,
"valid_targets_min": 351
},
{
"epoch": 4.908466819221968,
"grad_norm": 0.4866673735485943,
"learning_rate": 9.934188038290144e-06,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25013306736946106,
"step": 6435,
"valid_targets_mean": 3571.5,
"valid_targets_min": 1055
},
{
"epoch": 4.912280701754386,
"grad_norm": 0.5676709320301305,
"learning_rate": 9.90133661456546e-06,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3177274763584137,
"step": 6440,
"valid_targets_mean": 4374.2,
"valid_targets_min": 1454
},
{
"epoch": 4.916094584286804,
"grad_norm": 0.474411723432594,
"learning_rate": 9.86852172074952e-06,
"loss": 0.2652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2783035933971405,
"step": 6445,
"valid_targets_mean": 3933.2,
"valid_targets_min": 1212
},
{
"epoch": 4.919908466819222,
"grad_norm": 0.4310577771224861,
"learning_rate": 9.835743475543669e-06,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25968584418296814,
"step": 6450,
"valid_targets_mean": 4817.0,
"valid_targets_min": 1630
},
{
"epoch": 4.92372234935164,
"grad_norm": 0.4256333701579665,
"learning_rate": 9.80300199751671e-06,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2685914933681488,
"step": 6455,
"valid_targets_mean": 5068.5,
"valid_targets_min": 1395
},
{
"epoch": 4.927536231884058,
"grad_norm": 0.4020917325980264,
"learning_rate": 9.770297405104426e-06,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2310306578874588,
"step": 6460,
"valid_targets_mean": 5008.4,
"valid_targets_min": 1203
},
{
"epoch": 4.931350114416476,
"grad_norm": 0.424080030882146,
"learning_rate": 9.737629816609186e-06,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2726290225982666,
"step": 6465,
"valid_targets_mean": 5150.7,
"valid_targets_min": 280
},
{
"epoch": 4.935163996948894,
"grad_norm": 0.5078040027460309,
"learning_rate": 9.704999350199512e-06,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22907471656799316,
"step": 6470,
"valid_targets_mean": 3427.7,
"valid_targets_min": 456
},
{
"epoch": 4.938977879481312,
"grad_norm": 0.47313149739798094,
"learning_rate": 9.672406123909621e-06,
"loss": 0.2816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26523223519325256,
"step": 6475,
"valid_targets_mean": 4480.9,
"valid_targets_min": 480
},
{
"epoch": 4.94279176201373,
"grad_norm": 0.612986995052608,
"learning_rate": 9.639850255639047e-06,
"loss": 0.2767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3095862865447998,
"step": 6480,
"valid_targets_mean": 4458.4,
"valid_targets_min": 1012
},
{
"epoch": 4.946605644546148,
"grad_norm": 0.4697376419383409,
"learning_rate": 9.60733186315216e-06,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2794733941555023,
"step": 6485,
"valid_targets_mean": 4355.2,
"valid_targets_min": 1178
},
{
"epoch": 4.950419527078566,
"grad_norm": 0.4347464188066338,
"learning_rate": 9.574851064077805e-06,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26758232712745667,
"step": 6490,
"valid_targets_mean": 5047.6,
"valid_targets_min": 1477
},
{
"epoch": 4.954233409610984,
"grad_norm": 0.4523891272435883,
"learning_rate": 9.542407975908801e-06,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2836798131465912,
"step": 6495,
"valid_targets_mean": 4667.2,
"valid_targets_min": 941
},
{
"epoch": 4.958047292143402,
"grad_norm": 0.4439635451916094,
"learning_rate": 9.510002716001591e-06,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.291238009929657,
"step": 6500,
"valid_targets_mean": 5885.6,
"valid_targets_min": 1412
},
{
"epoch": 4.96186117467582,
"grad_norm": 0.5153040180095564,
"learning_rate": 9.477635401575752e-06,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24549072980880737,
"step": 6505,
"valid_targets_mean": 3759.1,
"valid_targets_min": 986
},
{
"epoch": 4.965675057208238,
"grad_norm": 0.5275444608815067,
"learning_rate": 9.44530614971362e-06,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27426838874816895,
"step": 6510,
"valid_targets_mean": 3683.1,
"valid_targets_min": 948
},
{
"epoch": 4.969488939740656,
"grad_norm": 0.441657014255363,
"learning_rate": 9.41301507735985e-06,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29648175835609436,
"step": 6515,
"valid_targets_mean": 4722.1,
"valid_targets_min": 1067
},
{
"epoch": 4.973302822273074,
"grad_norm": 0.4116526665237431,
"learning_rate": 9.380762301320964e-06,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2626621425151825,
"step": 6520,
"valid_targets_mean": 5578.3,
"valid_targets_min": 833
},
{
"epoch": 4.977116704805492,
"grad_norm": 0.45738516459947337,
"learning_rate": 9.348547938264993e-06,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26601141691207886,
"step": 6525,
"valid_targets_mean": 4418.0,
"valid_targets_min": 951
},
{
"epoch": 4.98093058733791,
"grad_norm": 0.43957493723393576,
"learning_rate": 9.316372104720978e-06,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2962207794189453,
"step": 6530,
"valid_targets_mean": 5003.0,
"valid_targets_min": 1026
},
{
"epoch": 4.9847444698703285,
"grad_norm": 0.4406600914628833,
"learning_rate": 9.284234917078618e-06,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27836713194847107,
"step": 6535,
"valid_targets_mean": 4530.5,
"valid_targets_min": 363
},
{
"epoch": 4.988558352402746,
"grad_norm": 0.4929584772121223,
"learning_rate": 9.252136491587796e-06,
"loss": 0.2748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30669355392456055,
"step": 6540,
"valid_targets_mean": 4779.3,
"valid_targets_min": 855
},
{
"epoch": 4.992372234935164,
"grad_norm": 0.45919666024271943,
"learning_rate": 9.220076944358198e-06,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2921316623687744,
"step": 6545,
"valid_targets_mean": 4566.1,
"valid_targets_min": 993
},
{
"epoch": 4.996186117467582,
"grad_norm": 0.496912636598731,
"learning_rate": 9.188056391358857e-06,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33465495705604553,
"step": 6550,
"valid_targets_mean": 4712.3,
"valid_targets_min": 1218
},
{
"epoch": 5.0,
"grad_norm": 1.4334764781852514,
"learning_rate": 9.15607494841777e-06,
"loss": 0.4533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4589976370334625,
"step": 6555,
"valid_targets_mean": 858.8,
"valid_targets_min": 497
},
{
"epoch": 5.003813882532418,
"grad_norm": 0.4637236359062967,
"learning_rate": 9.12413273122146e-06,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30440065264701843,
"step": 6560,
"valid_targets_mean": 5229.4,
"valid_targets_min": 1152
},
{
"epoch": 5.007627765064836,
"grad_norm": 0.5731758576495917,
"learning_rate": 9.092229855314541e-06,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34112057089805603,
"step": 6565,
"valid_targets_mean": 3283.0,
"valid_targets_min": 660
},
{
"epoch": 5.011441647597254,
"grad_norm": 0.46800535106530056,
"learning_rate": 9.060366436099337e-06,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2606760263442993,
"step": 6570,
"valid_targets_mean": 4470.2,
"valid_targets_min": 1025
},
{
"epoch": 5.015255530129672,
"grad_norm": 0.6137644660052498,
"learning_rate": 9.02854258883543e-06,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2700829803943634,
"step": 6575,
"valid_targets_mean": 4210.0,
"valid_targets_min": 345
},
{
"epoch": 5.01906941266209,
"grad_norm": 0.4878235171922639,
"learning_rate": 8.996758428639276e-06,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2577427923679352,
"step": 6580,
"valid_targets_mean": 4130.4,
"valid_targets_min": 1404
},
{
"epoch": 5.022883295194508,
"grad_norm": 0.4751599864581177,
"learning_rate": 8.965014070483749e-06,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24149303138256073,
"step": 6585,
"valid_targets_mean": 3961.3,
"valid_targets_min": 1118
},
{
"epoch": 5.026697177726926,
"grad_norm": 0.4592892732948017,
"learning_rate": 8.933309629197773e-06,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2872866988182068,
"step": 6590,
"valid_targets_mean": 4570.6,
"valid_targets_min": 782
},
{
"epoch": 5.030511060259344,
"grad_norm": 0.4243811711385429,
"learning_rate": 8.901645219465848e-06,
"loss": 0.2914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2821787893772125,
"step": 6595,
"valid_targets_mean": 4959.4,
"valid_targets_min": 1531
},
{
"epoch": 5.034324942791762,
"grad_norm": 0.40234791333162984,
"learning_rate": 8.870020955827697e-06,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24314086139202118,
"step": 6600,
"valid_targets_mean": 4961.0,
"valid_targets_min": 1151
},
{
"epoch": 5.03813882532418,
"grad_norm": 0.47734966546802016,
"learning_rate": 8.838436952677819e-06,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2361879199743271,
"step": 6605,
"valid_targets_mean": 3586.6,
"valid_targets_min": 449
},
{
"epoch": 5.041952707856598,
"grad_norm": 0.49430140990989624,
"learning_rate": 8.806893324265055e-06,
"loss": 0.2775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3115706145763397,
"step": 6610,
"valid_targets_mean": 4680.6,
"valid_targets_min": 1299
},
{
"epoch": 5.045766590389016,
"grad_norm": 0.455707973439489,
"learning_rate": 8.775390184692232e-06,
"loss": 0.2595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26760897040367126,
"step": 6615,
"valid_targets_mean": 4604.5,
"valid_targets_min": 833
},
{
"epoch": 5.049580472921434,
"grad_norm": 0.5010384461705412,
"learning_rate": 8.74392764791568e-06,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2379763126373291,
"step": 6620,
"valid_targets_mean": 3717.8,
"valid_targets_min": 301
},
{
"epoch": 5.053394355453852,
"grad_norm": 0.5298371448753371,
"learning_rate": 8.712505827744898e-06,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3061905801296234,
"step": 6625,
"valid_targets_mean": 3829.6,
"valid_targets_min": 1278
},
{
"epoch": 5.05720823798627,
"grad_norm": 0.4453159473628936,
"learning_rate": 8.681124837842057e-06,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2787354290485382,
"step": 6630,
"valid_targets_mean": 5117.9,
"valid_targets_min": 938
},
{
"epoch": 5.061022120518688,
"grad_norm": 0.47857296510039227,
"learning_rate": 8.64978479172167e-06,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26554688811302185,
"step": 6635,
"valid_targets_mean": 4001.0,
"valid_targets_min": 768
},
{
"epoch": 5.064836003051106,
"grad_norm": 0.46676260966328054,
"learning_rate": 8.618485802750119e-06,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28517279028892517,
"step": 6640,
"valid_targets_mean": 4640.2,
"valid_targets_min": 956
},
{
"epoch": 5.068649885583524,
"grad_norm": 0.47928071968710284,
"learning_rate": 8.58722798414528e-06,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27151843905448914,
"step": 6645,
"valid_targets_mean": 4000.2,
"valid_targets_min": 1232
},
{
"epoch": 5.072463768115942,
"grad_norm": 0.4471785238558857,
"learning_rate": 8.556011448976111e-06,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25223401188850403,
"step": 6650,
"valid_targets_mean": 4390.5,
"valid_targets_min": 659
},
{
"epoch": 5.07627765064836,
"grad_norm": 0.4668781382048033,
"learning_rate": 8.524836310162217e-06,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2625182271003723,
"step": 6655,
"valid_targets_mean": 4160.7,
"valid_targets_min": 972
},
{
"epoch": 5.080091533180778,
"grad_norm": 0.497840738820478,
"learning_rate": 8.493702680473481e-06,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22448588907718658,
"step": 6660,
"valid_targets_mean": 3680.2,
"valid_targets_min": 1247
},
{
"epoch": 5.083905415713196,
"grad_norm": 0.48363425185296266,
"learning_rate": 8.462610672529608e-06,
"loss": 0.275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23800963163375854,
"step": 6665,
"valid_targets_mean": 4145.7,
"valid_targets_min": 1149
},
{
"epoch": 5.087719298245614,
"grad_norm": 0.447347355895507,
"learning_rate": 8.431560398799779e-06,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2579364478588104,
"step": 6670,
"valid_targets_mean": 4632.5,
"valid_targets_min": 1081
},
{
"epoch": 5.091533180778032,
"grad_norm": 0.4394024565255274,
"learning_rate": 8.400551971602171e-06,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27306821942329407,
"step": 6675,
"valid_targets_mean": 4924.3,
"valid_targets_min": 1112
},
{
"epoch": 5.09534706331045,
"grad_norm": 0.41078294685140615,
"learning_rate": 8.369585503103628e-06,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21968694031238556,
"step": 6680,
"valid_targets_mean": 4687.0,
"valid_targets_min": 1765
},
{
"epoch": 5.099160945842868,
"grad_norm": 0.4286895396734995,
"learning_rate": 8.338661105319186e-06,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2512158751487732,
"step": 6685,
"valid_targets_mean": 4783.9,
"valid_targets_min": 872
},
{
"epoch": 5.102974828375286,
"grad_norm": 0.4346920938094104,
"learning_rate": 8.30777889011172e-06,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605276107788086,
"step": 6690,
"valid_targets_mean": 4795.2,
"valid_targets_min": 1039
},
{
"epoch": 5.106788710907704,
"grad_norm": 0.44722763124062953,
"learning_rate": 8.276938969191506e-06,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29144763946533203,
"step": 6695,
"valid_targets_mean": 5161.2,
"valid_targets_min": 1295
},
{
"epoch": 5.110602593440122,
"grad_norm": 0.46646851736725947,
"learning_rate": 8.246141454115821e-06,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22032219171524048,
"step": 6700,
"valid_targets_mean": 3884.6,
"valid_targets_min": 1002
},
{
"epoch": 5.11441647597254,
"grad_norm": 0.5070689669662287,
"learning_rate": 8.215386456288576e-06,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27866432070732117,
"step": 6705,
"valid_targets_mean": 4045.0,
"valid_targets_min": 1020
},
{
"epoch": 5.118230358504958,
"grad_norm": 0.9995311563170907,
"learning_rate": 8.18467408695985e-06,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2413589358329773,
"step": 6710,
"valid_targets_mean": 4955.4,
"valid_targets_min": 1056
},
{
"epoch": 5.122044241037376,
"grad_norm": 0.40195021820199256,
"learning_rate": 8.154004457225547e-06,
"loss": 0.2708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23771731555461884,
"step": 6715,
"valid_targets_mean": 4887.3,
"valid_targets_min": 1317
},
{
"epoch": 5.125858123569794,
"grad_norm": 0.4960976441570362,
"learning_rate": 8.123377678026962e-06,
"loss": 0.4059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26147928833961487,
"step": 6720,
"valid_targets_mean": 3697.1,
"valid_targets_min": 433
},
{
"epoch": 5.129672006102212,
"grad_norm": 0.4880702087976833,
"learning_rate": 8.092793860150376e-06,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27091705799102783,
"step": 6725,
"valid_targets_mean": 4247.1,
"valid_targets_min": 939
},
{
"epoch": 5.13348588863463,
"grad_norm": 0.4984676713106216,
"learning_rate": 8.062253114226688e-06,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24456210434436798,
"step": 6730,
"valid_targets_mean": 3648.6,
"valid_targets_min": 1373
},
{
"epoch": 5.137299771167048,
"grad_norm": 0.4626797380175307,
"learning_rate": 8.031755550730966e-06,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22191393375396729,
"step": 6735,
"valid_targets_mean": 3943.0,
"valid_targets_min": 990
},
{
"epoch": 5.141113653699466,
"grad_norm": 0.4684925381564363,
"learning_rate": 8.0013012799821e-06,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535335123538971,
"step": 6740,
"valid_targets_mean": 4291.0,
"valid_targets_min": 1033
},
{
"epoch": 5.144927536231884,
"grad_norm": 0.5231522942873892,
"learning_rate": 7.970890412142349e-06,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535442113876343,
"step": 6745,
"valid_targets_mean": 3662.4,
"valid_targets_min": 874
},
{
"epoch": 5.148741418764302,
"grad_norm": 0.47740089425599175,
"learning_rate": 7.940523057217007e-06,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27571263909339905,
"step": 6750,
"valid_targets_mean": 4590.5,
"valid_targets_min": 934
},
{
"epoch": 5.1525553012967205,
"grad_norm": 0.4694998058736014,
"learning_rate": 7.910199325053926e-06,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29670730233192444,
"step": 6755,
"valid_targets_mean": 5085.7,
"valid_targets_min": 1068
},
{
"epoch": 5.156369183829138,
"grad_norm": 0.5035311411179674,
"learning_rate": 7.879919325343198e-06,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24500465393066406,
"step": 6760,
"valid_targets_mean": 3302.5,
"valid_targets_min": 1013
},
{
"epoch": 5.160183066361556,
"grad_norm": 0.47053806545490146,
"learning_rate": 7.849683167616706e-06,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26875197887420654,
"step": 6765,
"valid_targets_mean": 4434.8,
"valid_targets_min": 1002
},
{
"epoch": 5.163996948893974,
"grad_norm": 0.47086093470609763,
"learning_rate": 7.819490961247738e-06,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2104368805885315,
"step": 6770,
"valid_targets_mean": 3852.2,
"valid_targets_min": 870
},
{
"epoch": 5.167810831426392,
"grad_norm": 0.4278205498892171,
"learning_rate": 7.789342815450614e-06,
"loss": 0.2811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29282939434051514,
"step": 6775,
"valid_targets_mean": 6059.0,
"valid_targets_min": 865
},
{
"epoch": 5.17162471395881,
"grad_norm": 0.4634629507302458,
"learning_rate": 7.759238839280245e-06,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2758885324001312,
"step": 6780,
"valid_targets_mean": 4304.7,
"valid_targets_min": 890
},
{
"epoch": 5.175438596491228,
"grad_norm": 0.45836552925576557,
"learning_rate": 7.729179141631804e-06,
"loss": 0.2558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2779264450073242,
"step": 6785,
"valid_targets_mean": 5225.0,
"valid_targets_min": 1847
},
{
"epoch": 5.1792524790236465,
"grad_norm": 0.438575576795386,
"learning_rate": 7.69916383124026e-06,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2508902847766876,
"step": 6790,
"valid_targets_mean": 5232.6,
"valid_targets_min": 1525
},
{
"epoch": 5.183066361556064,
"grad_norm": 0.4523443599950125,
"learning_rate": 7.669193016680049e-06,
"loss": 0.2659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2792450189590454,
"step": 6795,
"valid_targets_mean": 4931.0,
"valid_targets_min": 1398
},
{
"epoch": 5.186880244088482,
"grad_norm": 0.5896330188216606,
"learning_rate": 7.639266806364627e-06,
"loss": 0.262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2727765738964081,
"step": 6800,
"valid_targets_mean": 4803.3,
"valid_targets_min": 787
},
{
"epoch": 5.1906941266209,
"grad_norm": 0.4007427104448006,
"learning_rate": 7.60938530854612e-06,
"loss": 0.2658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25615957379341125,
"step": 6805,
"valid_targets_mean": 5634.1,
"valid_targets_min": 1214
},
{
"epoch": 5.194508009153318,
"grad_norm": 0.476018360455716,
"learning_rate": 7.579548631314919e-06,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22604842483997345,
"step": 6810,
"valid_targets_mean": 4041.0,
"valid_targets_min": 1198
},
{
"epoch": 5.198321891685736,
"grad_norm": 0.4746406522279334,
"learning_rate": 7.549756882599262e-06,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2810885012149811,
"step": 6815,
"valid_targets_mean": 4864.0,
"valid_targets_min": 348
},
{
"epoch": 5.202135774218154,
"grad_norm": 0.44123239571536454,
"learning_rate": 7.520010170164897e-06,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29340696334838867,
"step": 6820,
"valid_targets_mean": 4571.4,
"valid_targets_min": 1294
},
{
"epoch": 5.2059496567505725,
"grad_norm": 0.5181410495929143,
"learning_rate": 7.490308601614633e-06,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3056938648223877,
"step": 6825,
"valid_targets_mean": 3920.4,
"valid_targets_min": 934
},
{
"epoch": 5.20976353928299,
"grad_norm": 0.43776302603903644,
"learning_rate": 7.460652284388006e-06,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2616339325904846,
"step": 6830,
"valid_targets_mean": 4601.6,
"valid_targets_min": 863
},
{
"epoch": 5.213577421815408,
"grad_norm": 0.4420958323537919,
"learning_rate": 7.431041325760842e-06,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28292545676231384,
"step": 6835,
"valid_targets_mean": 4929.3,
"valid_targets_min": 981
},
{
"epoch": 5.217391304347826,
"grad_norm": 0.44810324346126695,
"learning_rate": 7.4014758328449134e-06,
"loss": 0.282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2579541802406311,
"step": 6840,
"valid_targets_mean": 4549.0,
"valid_targets_min": 1071
},
{
"epoch": 5.221205186880244,
"grad_norm": 0.461760509560138,
"learning_rate": 7.3719559125875055e-06,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2631801664829254,
"step": 6845,
"valid_targets_mean": 4591.1,
"valid_targets_min": 1050
},
{
"epoch": 5.225019069412662,
"grad_norm": 0.44979052496347216,
"learning_rate": 7.342481671771069e-06,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3014061152935028,
"step": 6850,
"valid_targets_mean": 4955.3,
"valid_targets_min": 935
},
{
"epoch": 5.22883295194508,
"grad_norm": 0.45496952765153387,
"learning_rate": 7.313053217012827e-06,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2862650752067566,
"step": 6855,
"valid_targets_mean": 4854.8,
"valid_targets_min": 1379
},
{
"epoch": 5.232646834477498,
"grad_norm": 0.4852937715560849,
"learning_rate": 7.28367065476435e-06,
"loss": 0.2606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27204573154449463,
"step": 6860,
"valid_targets_mean": 4125.8,
"valid_targets_min": 1221
},
{
"epoch": 5.236460717009916,
"grad_norm": 0.4984472817633318,
"learning_rate": 7.254334091311239e-06,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2766822576522827,
"step": 6865,
"valid_targets_mean": 4148.9,
"valid_targets_min": 1389
},
{
"epoch": 5.240274599542334,
"grad_norm": 0.5046422054288014,
"learning_rate": 7.225043632772666e-06,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23229973018169403,
"step": 6870,
"valid_targets_mean": 3703.2,
"valid_targets_min": 1119
},
{
"epoch": 5.244088482074752,
"grad_norm": 0.47075224858655285,
"learning_rate": 7.195799385101066e-06,
"loss": 0.2693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21081803739070892,
"step": 6875,
"valid_targets_mean": 4031.1,
"valid_targets_min": 1148
},
{
"epoch": 5.24790236460717,
"grad_norm": 1.06539071338913,
"learning_rate": 7.166601454081674e-06,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39799293875694275,
"step": 6880,
"valid_targets_mean": 1204.7,
"valid_targets_min": 562
},
{
"epoch": 5.251716247139588,
"grad_norm": 0.8053847363374328,
"learning_rate": 7.1374499453322265e-06,
"loss": 0.448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3278617262840271,
"step": 6885,
"valid_targets_mean": 1777.9,
"valid_targets_min": 629
},
{
"epoch": 5.255530129672006,
"grad_norm": 0.49179591973926917,
"learning_rate": 7.108344964302499e-06,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2707764208316803,
"step": 6890,
"valid_targets_mean": 4019.2,
"valid_targets_min": 610
},
{
"epoch": 5.259344012204424,
"grad_norm": 0.4672780099759257,
"learning_rate": 7.079286616273986e-06,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21976228058338165,
"step": 6895,
"valid_targets_mean": 4157.5,
"valid_targets_min": 1035
},
{
"epoch": 5.2631578947368425,
"grad_norm": 0.44433342694406336,
"learning_rate": 7.050275006359493e-06,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29698076844215393,
"step": 6900,
"valid_targets_mean": 5283.3,
"valid_targets_min": 1131
},
{
"epoch": 5.26697177726926,
"grad_norm": 0.5223006039476878,
"learning_rate": 7.0213102395027475e-06,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27178704738616943,
"step": 6905,
"valid_targets_mean": 3426.8,
"valid_targets_min": 1044
},
{
"epoch": 5.270785659801678,
"grad_norm": 0.4809130633033059,
"learning_rate": 6.9923924204780495e-06,
"loss": 0.2789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2610607147216797,
"step": 6910,
"valid_targets_mean": 4059.3,
"valid_targets_min": 385
},
{
"epoch": 5.274599542334096,
"grad_norm": 0.5044092120968204,
"learning_rate": 6.963521653889853e-06,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28660058975219727,
"step": 6915,
"valid_targets_mean": 4845.2,
"valid_targets_min": 978
},
{
"epoch": 5.278413424866514,
"grad_norm": 0.5104496438847528,
"learning_rate": 6.934698044172435e-06,
"loss": 0.2453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24992434680461884,
"step": 6920,
"valid_targets_mean": 3877.2,
"valid_targets_min": 468
},
{
"epoch": 5.282227307398932,
"grad_norm": 0.5110715915878371,
"learning_rate": 6.905921695589461e-06,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24427704513072968,
"step": 6925,
"valid_targets_mean": 4894.0,
"valid_targets_min": 1049
},
{
"epoch": 5.28604118993135,
"grad_norm": 0.4788393046415271,
"learning_rate": 6.877192712233673e-06,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2587161362171173,
"step": 6930,
"valid_targets_mean": 4604.5,
"valid_targets_min": 1024
},
{
"epoch": 5.2898550724637685,
"grad_norm": 0.5212077492613079,
"learning_rate": 6.8485111980264485e-06,
"loss": 0.2513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25677958130836487,
"step": 6935,
"valid_targets_mean": 4370.5,
"valid_targets_min": 1018
},
{
"epoch": 5.293668954996186,
"grad_norm": 0.5081127694045978,
"learning_rate": 6.819877256717471e-06,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2486242800951004,
"step": 6940,
"valid_targets_mean": 3836.2,
"valid_targets_min": 336
},
{
"epoch": 5.297482837528604,
"grad_norm": 0.46264486257794624,
"learning_rate": 6.791290991884343e-06,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2491236925125122,
"step": 6945,
"valid_targets_mean": 4162.0,
"valid_targets_min": 1472
},
{
"epoch": 5.301296720061022,
"grad_norm": 0.5517594238630391,
"learning_rate": 6.762752506932186e-06,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23130156099796295,
"step": 6950,
"valid_targets_mean": 4125.0,
"valid_targets_min": 1314
},
{
"epoch": 5.30511060259344,
"grad_norm": 0.5117419037061384,
"learning_rate": 6.734261905093315e-06,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29466712474823,
"step": 6955,
"valid_targets_mean": 4019.8,
"valid_targets_min": 1289
},
{
"epoch": 5.308924485125858,
"grad_norm": 0.4774587493320638,
"learning_rate": 6.705819289426807e-06,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23725992441177368,
"step": 6960,
"valid_targets_mean": 4301.6,
"valid_targets_min": 504
},
{
"epoch": 5.312738367658276,
"grad_norm": 0.4367236063617533,
"learning_rate": 6.67742476281819e-06,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27271658182144165,
"step": 6965,
"valid_targets_mean": 4865.9,
"valid_targets_min": 1739
},
{
"epoch": 5.3165522501906946,
"grad_norm": 0.5402725692551985,
"learning_rate": 6.649078427979008e-06,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31718483567237854,
"step": 6970,
"valid_targets_mean": 3822.7,
"valid_targets_min": 674
},
{
"epoch": 5.320366132723112,
"grad_norm": 0.5475992817437416,
"learning_rate": 6.62078038744651e-06,
"loss": 0.2461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2607622444629669,
"step": 6975,
"valid_targets_mean": 3495.9,
"valid_targets_min": 274
},
{
"epoch": 5.32418001525553,
"grad_norm": 0.44930905451217984,
"learning_rate": 6.592530743583223e-06,
"loss": 0.258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23356647789478302,
"step": 6980,
"valid_targets_mean": 4413.0,
"valid_targets_min": 1244
},
{
"epoch": 5.327993897787948,
"grad_norm": 0.49257972443447445,
"learning_rate": 6.564329598576631e-06,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3146706521511078,
"step": 6985,
"valid_targets_mean": 4495.7,
"valid_targets_min": 919
},
{
"epoch": 5.331807780320366,
"grad_norm": 0.4915267580498807,
"learning_rate": 6.536177054438777e-06,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2633446455001831,
"step": 6990,
"valid_targets_mean": 4100.7,
"valid_targets_min": 1543
},
{
"epoch": 5.335621662852784,
"grad_norm": 0.527306128608921,
"learning_rate": 6.508073213005886e-06,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28533294796943665,
"step": 6995,
"valid_targets_mean": 3935.1,
"valid_targets_min": 890
},
{
"epoch": 5.339435545385202,
"grad_norm": 0.49659900179345723,
"learning_rate": 6.480018175938032e-06,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2267284244298935,
"step": 7000,
"valid_targets_mean": 3676.0,
"valid_targets_min": 1351
},
{
"epoch": 5.34324942791762,
"grad_norm": 0.431485347943722,
"learning_rate": 6.4520120447187366e-06,
"loss": 0.279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27338099479675293,
"step": 7005,
"valid_targets_mean": 5130.5,
"valid_targets_min": 1279
},
{
"epoch": 5.3470633104500385,
"grad_norm": 0.4509333030627232,
"learning_rate": 6.424054920654607e-06,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27152150869369507,
"step": 7010,
"valid_targets_mean": 4593.5,
"valid_targets_min": 1281
},
{
"epoch": 5.350877192982456,
"grad_norm": 0.4756213671492397,
"learning_rate": 6.396146904875001e-06,
"loss": 0.2675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2602352201938629,
"step": 7015,
"valid_targets_mean": 4143.6,
"valid_targets_min": 1026
},
{
"epoch": 5.354691075514874,
"grad_norm": 0.4366604334192552,
"learning_rate": 6.368288098331605e-06,
"loss": 0.2617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2461734563112259,
"step": 7020,
"valid_targets_mean": 4280.2,
"valid_targets_min": 1094
},
{
"epoch": 5.358504958047292,
"grad_norm": 0.49410785049881645,
"learning_rate": 6.340478601798132e-06,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26815125346183777,
"step": 7025,
"valid_targets_mean": 4111.7,
"valid_targets_min": 1306
},
{
"epoch": 5.36231884057971,
"grad_norm": 0.45759646347454747,
"learning_rate": 6.312718515869902e-06,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22155439853668213,
"step": 7030,
"valid_targets_mean": 4103.8,
"valid_targets_min": 447
},
{
"epoch": 5.366132723112128,
"grad_norm": 0.4845186523017412,
"learning_rate": 6.285007940963519e-06,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27183595299720764,
"step": 7035,
"valid_targets_mean": 3842.2,
"valid_targets_min": 395
},
{
"epoch": 5.369946605644546,
"grad_norm": 0.4573500237101827,
"learning_rate": 6.257346977316474e-06,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2306838482618332,
"step": 7040,
"valid_targets_mean": 4493.4,
"valid_targets_min": 1671
},
{
"epoch": 5.3737604881769645,
"grad_norm": 0.9156027305404644,
"learning_rate": 6.229735724986821e-06,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3673783540725708,
"step": 7045,
"valid_targets_mean": 1448.0,
"valid_targets_min": 675
},
{
"epoch": 5.377574370709382,
"grad_norm": 0.5348366671099393,
"learning_rate": 6.202174283852766e-06,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2646300494670868,
"step": 7050,
"valid_targets_mean": 4003.0,
"valid_targets_min": 1379
},
{
"epoch": 5.3813882532418,
"grad_norm": 0.4493967568819422,
"learning_rate": 6.174662753612355e-06,
"loss": 0.2824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2676180601119995,
"step": 7055,
"valid_targets_mean": 4638.2,
"valid_targets_min": 1044
},
{
"epoch": 5.385202135774218,
"grad_norm": 0.44339585866075004,
"learning_rate": 6.147201233783087e-06,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2779521048069,
"step": 7060,
"valid_targets_mean": 4827.2,
"valid_targets_min": 416
},
{
"epoch": 5.389016018306636,
"grad_norm": 0.4916923429041741,
"learning_rate": 6.119789823701548e-06,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26473018527030945,
"step": 7065,
"valid_targets_mean": 4566.0,
"valid_targets_min": 1278
},
{
"epoch": 5.392829900839054,
"grad_norm": 0.4666991074580145,
"learning_rate": 6.092428622523074e-06,
"loss": 0.2716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3047803044319153,
"step": 7070,
"valid_targets_mean": 5045.8,
"valid_targets_min": 1274
},
{
"epoch": 5.396643783371472,
"grad_norm": 0.4567416421356613,
"learning_rate": 6.065117729221368e-06,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2584697902202606,
"step": 7075,
"valid_targets_mean": 4706.9,
"valid_targets_min": 1275
},
{
"epoch": 5.4004576659038905,
"grad_norm": 0.44314444752444254,
"learning_rate": 6.037857242588172e-06,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23497982323169708,
"step": 7080,
"valid_targets_mean": 4559.0,
"valid_targets_min": 1282
},
{
"epoch": 5.404271548436308,
"grad_norm": 0.48014425623093515,
"learning_rate": 6.01064726123287e-06,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25778788328170776,
"step": 7085,
"valid_targets_mean": 4872.2,
"valid_targets_min": 587
},
{
"epoch": 5.408085430968726,
"grad_norm": 0.45115923207142167,
"learning_rate": 5.983487883582176e-06,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2704853117465973,
"step": 7090,
"valid_targets_mean": 5120.1,
"valid_targets_min": 531
},
{
"epoch": 5.411899313501144,
"grad_norm": 0.4945409660156044,
"learning_rate": 5.9563792078797275e-06,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2888518273830414,
"step": 7095,
"valid_targets_mean": 5236.5,
"valid_targets_min": 1493
},
{
"epoch": 5.415713196033562,
"grad_norm": 0.4567007952044338,
"learning_rate": 5.9293213321857865e-06,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22163493931293488,
"step": 7100,
"valid_targets_mean": 4193.8,
"valid_targets_min": 1929
},
{
"epoch": 5.41952707856598,
"grad_norm": 0.4842090926003661,
"learning_rate": 5.902314354376845e-06,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25373324751853943,
"step": 7105,
"valid_targets_mean": 4655.1,
"valid_targets_min": 1354
},
{
"epoch": 5.423340961098398,
"grad_norm": 0.41473599298153047,
"learning_rate": 5.87535837214527e-06,
"loss": 0.2803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26143643260002136,
"step": 7110,
"valid_targets_mean": 5557.0,
"valid_targets_min": 1151
},
{
"epoch": 5.427154843630817,
"grad_norm": 0.4441541614997986,
"learning_rate": 5.848453482998986e-06,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2161817103624344,
"step": 7115,
"valid_targets_mean": 4495.2,
"valid_targets_min": 999
},
{
"epoch": 5.4309687261632345,
"grad_norm": 0.4471035984291613,
"learning_rate": 5.8215997842610695e-06,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28700459003448486,
"step": 7120,
"valid_targets_mean": 4882.1,
"valid_targets_min": 987
},
{
"epoch": 5.434782608695652,
"grad_norm": 0.47288529174681054,
"learning_rate": 5.794797373069454e-06,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2508050799369812,
"step": 7125,
"valid_targets_mean": 4713.7,
"valid_targets_min": 1686
},
{
"epoch": 5.43859649122807,
"grad_norm": 0.4960945585855858,
"learning_rate": 5.768046346376528e-06,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2533581256866455,
"step": 7130,
"valid_targets_mean": 3984.4,
"valid_targets_min": 977
},
{
"epoch": 5.442410373760488,
"grad_norm": 0.49188617193973644,
"learning_rate": 5.7413468009488284e-06,
"loss": 0.2334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20482134819030762,
"step": 7135,
"valid_targets_mean": 3737.5,
"valid_targets_min": 354
},
{
"epoch": 5.446224256292906,
"grad_norm": 0.6000775297843542,
"learning_rate": 5.714698833366641e-06,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2533903419971466,
"step": 7140,
"valid_targets_mean": 3571.9,
"valid_targets_min": 1005
},
{
"epoch": 5.450038138825324,
"grad_norm": 0.45340382274911345,
"learning_rate": 5.688102540023705e-06,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2805597484111786,
"step": 7145,
"valid_targets_mean": 5255.7,
"valid_targets_min": 750
},
{
"epoch": 5.453852021357742,
"grad_norm": 0.4410601983842463,
"learning_rate": 5.661558017126834e-06,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2243202179670334,
"step": 7150,
"valid_targets_mean": 4318.8,
"valid_targets_min": 1350
},
{
"epoch": 5.4576659038901605,
"grad_norm": 0.466304205959976,
"learning_rate": 5.635065360695555e-06,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2674126625061035,
"step": 7155,
"valid_targets_mean": 4463.6,
"valid_targets_min": 1353
},
{
"epoch": 5.461479786422578,
"grad_norm": 0.47987541986780025,
"learning_rate": 5.608624666561799e-06,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2757456302642822,
"step": 7160,
"valid_targets_mean": 4238.0,
"valid_targets_min": 495
},
{
"epoch": 5.465293668954996,
"grad_norm": 0.4723114447122454,
"learning_rate": 5.582236030369514e-06,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29881516098976135,
"step": 7165,
"valid_targets_mean": 5455.1,
"valid_targets_min": 1228
},
{
"epoch": 5.469107551487414,
"grad_norm": 0.47351422373374047,
"learning_rate": 5.5558995475743635e-06,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28124120831489563,
"step": 7170,
"valid_targets_mean": 4546.2,
"valid_targets_min": 1467
},
{
"epoch": 5.472921434019832,
"grad_norm": 0.4581850087130719,
"learning_rate": 5.529615313443328e-06,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.263645738363266,
"step": 7175,
"valid_targets_mean": 4665.4,
"valid_targets_min": 1231
},
{
"epoch": 5.47673531655225,
"grad_norm": 0.44445804803224537,
"learning_rate": 5.503383423054418e-06,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29965755343437195,
"step": 7180,
"valid_targets_mean": 4919.1,
"valid_targets_min": 401
},
{
"epoch": 5.480549199084669,
"grad_norm": 0.48072448807053203,
"learning_rate": 5.47720397129627e-06,
"loss": 0.2816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2851342558860779,
"step": 7185,
"valid_targets_mean": 3921.5,
"valid_targets_min": 807
},
{
"epoch": 5.4843630816170865,
"grad_norm": 0.5429782499885556,
"learning_rate": 5.451077052867859e-06,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23518866300582886,
"step": 7190,
"valid_targets_mean": 3978.4,
"valid_targets_min": 715
},
{
"epoch": 5.488176964149504,
"grad_norm": 0.5600448299096479,
"learning_rate": 5.425002762278127e-06,
"loss": 0.2463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23407478630542755,
"step": 7195,
"valid_targets_mean": 3173.8,
"valid_targets_min": 933
},
{
"epoch": 5.491990846681922,
"grad_norm": 0.5169549649125209,
"learning_rate": 5.39898119384563e-06,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2725510895252228,
"step": 7200,
"valid_targets_mean": 4044.9,
"valid_targets_min": 1272
},
{
"epoch": 5.49580472921434,
"grad_norm": 0.5459825367677725,
"learning_rate": 5.373012441698235e-06,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2436116337776184,
"step": 7205,
"valid_targets_mean": 3122.2,
"valid_targets_min": 457
},
{
"epoch": 5.499618611746758,
"grad_norm": 0.6737293290695994,
"learning_rate": 5.347096599772732e-06,
"loss": 0.4182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28409695625305176,
"step": 7210,
"valid_targets_mean": 2758.2,
"valid_targets_min": 574
},
{
"epoch": 5.503432494279176,
"grad_norm": 0.47869919663122357,
"learning_rate": 5.3212337618145416e-06,
"loss": 0.2654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2792750895023346,
"step": 7215,
"valid_targets_mean": 4658.0,
"valid_targets_min": 1364
},
{
"epoch": 5.507246376811594,
"grad_norm": 0.46056094352248905,
"learning_rate": 5.295424021377331e-06,
"loss": 0.2504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25706204771995544,
"step": 7220,
"valid_targets_mean": 4113.9,
"valid_targets_min": 815
},
{
"epoch": 5.511060259344013,
"grad_norm": 0.4464065222279077,
"learning_rate": 5.269667471822721e-06,
"loss": 0.2716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23010754585266113,
"step": 7225,
"valid_targets_mean": 4441.2,
"valid_targets_min": 1100
},
{
"epoch": 5.51487414187643,
"grad_norm": 0.4534242612135644,
"learning_rate": 5.243964206319905e-06,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25065717101097107,
"step": 7230,
"valid_targets_mean": 4198.2,
"valid_targets_min": 967
},
{
"epoch": 5.518688024408848,
"grad_norm": 0.4465601339441509,
"learning_rate": 5.218314317845341e-06,
"loss": 0.2652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2715952694416046,
"step": 7235,
"valid_targets_mean": 5195.9,
"valid_targets_min": 1113
},
{
"epoch": 5.522501906941266,
"grad_norm": 0.49623684714776733,
"learning_rate": 5.192717899182414e-06,
"loss": 0.2774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2818422019481659,
"step": 7240,
"valid_targets_mean": 3791.5,
"valid_targets_min": 1313
},
{
"epoch": 5.526315789473684,
"grad_norm": 0.5387411414011866,
"learning_rate": 5.1671750429210706e-06,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26141834259033203,
"step": 7245,
"valid_targets_mean": 3960.7,
"valid_targets_min": 844
},
{
"epoch": 5.530129672006102,
"grad_norm": 0.4733982326591677,
"learning_rate": 5.141685841457531e-06,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2717835307121277,
"step": 7250,
"valid_targets_mean": 4288.9,
"valid_targets_min": 1040
},
{
"epoch": 5.53394355453852,
"grad_norm": 0.4560601736804632,
"learning_rate": 5.116250386993908e-06,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23000472784042358,
"step": 7255,
"valid_targets_mean": 3966.4,
"valid_targets_min": 1084
},
{
"epoch": 5.537757437070939,
"grad_norm": 0.45789216879423134,
"learning_rate": 5.090868771537918e-06,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2920645773410797,
"step": 7260,
"valid_targets_mean": 5077.2,
"valid_targets_min": 1141
},
{
"epoch": 5.5415713196033565,
"grad_norm": 0.46197101608486557,
"learning_rate": 5.065541086902499e-06,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24757897853851318,
"step": 7265,
"valid_targets_mean": 4411.2,
"valid_targets_min": 1106
},
{
"epoch": 5.545385202135774,
"grad_norm": 0.49869011412423253,
"learning_rate": 5.040267424705531e-06,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26691606640815735,
"step": 7270,
"valid_targets_mean": 4098.8,
"valid_targets_min": 881
},
{
"epoch": 5.549199084668192,
"grad_norm": 0.46561034630392756,
"learning_rate": 5.015047876369456e-06,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2835874557495117,
"step": 7275,
"valid_targets_mean": 4925.6,
"valid_targets_min": 1056
},
{
"epoch": 5.55301296720061,
"grad_norm": 0.49268173538897586,
"learning_rate": 4.989882533120985e-06,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28856849670410156,
"step": 7280,
"valid_targets_mean": 4464.0,
"valid_targets_min": 1397
},
{
"epoch": 5.556826849733028,
"grad_norm": 0.5405525220524633,
"learning_rate": 4.964771485990753e-06,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24683456122875214,
"step": 7285,
"valid_targets_mean": 3427.6,
"valid_targets_min": 850
},
{
"epoch": 5.560640732265446,
"grad_norm": 0.522144174272764,
"learning_rate": 4.939714825812976e-06,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2464541345834732,
"step": 7290,
"valid_targets_mean": 3456.2,
"valid_targets_min": 928
},
{
"epoch": 5.564454614797864,
"grad_norm": 0.4972765834947173,
"learning_rate": 4.914712643225155e-06,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27163538336753845,
"step": 7295,
"valid_targets_mean": 4422.6,
"valid_targets_min": 1164
},
{
"epoch": 5.5682684973302825,
"grad_norm": 0.46118503283223744,
"learning_rate": 4.889765028667706e-06,
"loss": 0.2491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30164602398872375,
"step": 7300,
"valid_targets_mean": 5380.8,
"valid_targets_min": 1094
},
{
"epoch": 5.5720823798627,
"grad_norm": 0.41517681084142244,
"learning_rate": 4.8648720723836815e-06,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2422560453414917,
"step": 7305,
"valid_targets_mean": 5003.5,
"valid_targets_min": 1181
},
{
"epoch": 5.575896262395118,
"grad_norm": 0.519351689521643,
"learning_rate": 4.840033864418394e-06,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.278678297996521,
"step": 7310,
"valid_targets_mean": 3523.4,
"valid_targets_min": 652
},
{
"epoch": 5.579710144927536,
"grad_norm": 0.4491216603709415,
"learning_rate": 4.815250494619142e-06,
"loss": 0.2748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2643551826477051,
"step": 7315,
"valid_targets_mean": 4933.9,
"valid_targets_min": 887
},
{
"epoch": 5.583524027459954,
"grad_norm": 0.49558408715788765,
"learning_rate": 4.790522052634832e-06,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29052674770355225,
"step": 7320,
"valid_targets_mean": 3924.8,
"valid_targets_min": 909
},
{
"epoch": 5.587337909992372,
"grad_norm": 0.4408746776163538,
"learning_rate": 4.7658486279156855e-06,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2446516901254654,
"step": 7325,
"valid_targets_mean": 4569.1,
"valid_targets_min": 1411
},
{
"epoch": 5.591151792524791,
"grad_norm": 0.4717219750374338,
"learning_rate": 4.74123030971293e-06,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24252106249332428,
"step": 7330,
"valid_targets_mean": 4408.3,
"valid_targets_min": 1060
},
{
"epoch": 5.5949656750572085,
"grad_norm": 0.4964043406119739,
"learning_rate": 4.716667187078426e-06,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2528547942638397,
"step": 7335,
"valid_targets_mean": 3936.3,
"valid_targets_min": 1230
},
{
"epoch": 5.598779557589626,
"grad_norm": 0.46290044328099633,
"learning_rate": 4.692159348864405e-06,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23730583488941193,
"step": 7340,
"valid_targets_mean": 4176.9,
"valid_targets_min": 306
},
{
"epoch": 5.602593440122044,
"grad_norm": 0.526359122756289,
"learning_rate": 4.667706883723089e-06,
"loss": 0.2672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23432885110378265,
"step": 7345,
"valid_targets_mean": 3812.0,
"valid_targets_min": 917
},
{
"epoch": 5.606407322654462,
"grad_norm": 0.4488365832771667,
"learning_rate": 4.6433098801064216e-06,
"loss": 0.2446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22697098553180695,
"step": 7350,
"valid_targets_mean": 4373.7,
"valid_targets_min": 991
},
{
"epoch": 5.61022120518688,
"grad_norm": 0.4454358707434032,
"learning_rate": 4.61896842626572e-06,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2983551323413849,
"step": 7355,
"valid_targets_mean": 5246.0,
"valid_targets_min": 927
},
{
"epoch": 5.614035087719298,
"grad_norm": 0.4353310092624839,
"learning_rate": 4.594682610251349e-06,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2707470655441284,
"step": 7360,
"valid_targets_mean": 5198.0,
"valid_targets_min": 1305
},
{
"epoch": 5.617848970251716,
"grad_norm": 0.4924961276507448,
"learning_rate": 4.570452519912434e-06,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22331412136554718,
"step": 7365,
"valid_targets_mean": 3868.3,
"valid_targets_min": 840
},
{
"epoch": 5.621662852784135,
"grad_norm": 0.49740165985344104,
"learning_rate": 4.5462782428965e-06,
"loss": 0.2807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26943090558052063,
"step": 7370,
"valid_targets_mean": 4378.5,
"valid_targets_min": 1324
},
{
"epoch": 5.6254767353165525,
"grad_norm": 1.4631518670559964,
"learning_rate": 4.52215986664921e-06,
"loss": 0.4228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42682841420173645,
"step": 7375,
"valid_targets_mean": 834.8,
"valid_targets_min": 622
},
{
"epoch": 5.62929061784897,
"grad_norm": 0.4760786300585858,
"learning_rate": 4.498097478413981e-06,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24382078647613525,
"step": 7380,
"valid_targets_mean": 4504.2,
"valid_targets_min": 356
},
{
"epoch": 5.633104500381388,
"grad_norm": 0.4626734833552102,
"learning_rate": 4.474091165231737e-06,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2557976543903351,
"step": 7385,
"valid_targets_mean": 4257.1,
"valid_targets_min": 1598
},
{
"epoch": 5.636918382913806,
"grad_norm": 0.4742996077597775,
"learning_rate": 4.450141013940534e-06,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23813612759113312,
"step": 7390,
"valid_targets_mean": 4133.5,
"valid_targets_min": 1372
},
{
"epoch": 5.640732265446224,
"grad_norm": 0.45938048208501386,
"learning_rate": 4.426247111175297e-06,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21757149696350098,
"step": 7395,
"valid_targets_mean": 4052.1,
"valid_targets_min": 657
},
{
"epoch": 5.644546147978643,
"grad_norm": 0.46051709275793706,
"learning_rate": 4.402409543367472e-06,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2812298536300659,
"step": 7400,
"valid_targets_mean": 4681.9,
"valid_targets_min": 946
},
{
"epoch": 5.648360030511061,
"grad_norm": 0.4520687879121962,
"learning_rate": 4.378628396744717e-06,
"loss": 0.2829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29354262351989746,
"step": 7405,
"valid_targets_mean": 5111.8,
"valid_targets_min": 1202
},
{
"epoch": 5.6521739130434785,
"grad_norm": 0.45662177723316266,
"learning_rate": 4.354903757330619e-06,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29141366481781006,
"step": 7410,
"valid_targets_mean": 5248.5,
"valid_targets_min": 1118
},
{
"epoch": 5.655987795575896,
"grad_norm": 0.5798114965925926,
"learning_rate": 4.3312357109443345e-06,
"loss": 0.2684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26307177543640137,
"step": 7415,
"valid_targets_mean": 4735.7,
"valid_targets_min": 1169
},
{
"epoch": 5.659801678108314,
"grad_norm": 0.4632669903920861,
"learning_rate": 4.307624343200332e-06,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24400150775909424,
"step": 7420,
"valid_targets_mean": 4341.5,
"valid_targets_min": 514
},
{
"epoch": 5.663615560640732,
"grad_norm": 0.47567506904850365,
"learning_rate": 4.284069739508032e-06,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2501218914985657,
"step": 7425,
"valid_targets_mean": 4060.4,
"valid_targets_min": 793
},
{
"epoch": 5.66742944317315,
"grad_norm": 0.4784400024841789,
"learning_rate": 4.2605719850715445e-06,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24574881792068481,
"step": 7430,
"valid_targets_mean": 4294.8,
"valid_targets_min": 943
},
{
"epoch": 5.671243325705568,
"grad_norm": 0.5133347500185746,
"learning_rate": 4.237131164889321e-06,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27007922530174255,
"step": 7435,
"valid_targets_mean": 4046.4,
"valid_targets_min": 1159
},
{
"epoch": 5.675057208237987,
"grad_norm": 0.4539076379605323,
"learning_rate": 4.213747363753875e-06,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24426043033599854,
"step": 7440,
"valid_targets_mean": 4678.9,
"valid_targets_min": 1080
},
{
"epoch": 5.6788710907704045,
"grad_norm": 0.4619730738815801,
"learning_rate": 4.190420666251467e-06,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22337813675403595,
"step": 7445,
"valid_targets_mean": 4274.1,
"valid_targets_min": 1006
},
{
"epoch": 5.682684973302822,
"grad_norm": 0.5289760710330429,
"learning_rate": 4.1671511567617816e-06,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23961704969406128,
"step": 7450,
"valid_targets_mean": 3701.7,
"valid_targets_min": 1264
},
{
"epoch": 5.68649885583524,
"grad_norm": 0.4077567627073792,
"learning_rate": 4.143938919457659e-06,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22072581946849823,
"step": 7455,
"valid_targets_mean": 5214.0,
"valid_targets_min": 1596
},
{
"epoch": 5.690312738367658,
"grad_norm": 0.5715728165292766,
"learning_rate": 4.120784038304743e-06,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26193735003471375,
"step": 7460,
"valid_targets_mean": 3611.3,
"valid_targets_min": 906
},
{
"epoch": 5.694126620900076,
"grad_norm": 0.5026260419778403,
"learning_rate": 4.0976865970612305e-06,
"loss": 0.2511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22939319908618927,
"step": 7465,
"valid_targets_mean": 3772.9,
"valid_targets_min": 431
},
{
"epoch": 5.697940503432494,
"grad_norm": 0.47404174633602586,
"learning_rate": 4.074646679277514e-06,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25620734691619873,
"step": 7470,
"valid_targets_mean": 4115.8,
"valid_targets_min": 843
},
{
"epoch": 5.701754385964913,
"grad_norm": 0.44644681572700895,
"learning_rate": 4.051664368295931e-06,
"loss": 0.2564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22743135690689087,
"step": 7475,
"valid_targets_mean": 4980.8,
"valid_targets_min": 2055
},
{
"epoch": 5.705568268497331,
"grad_norm": 0.4762637154157596,
"learning_rate": 4.028739747250414e-06,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29567673802375793,
"step": 7480,
"valid_targets_mean": 5021.9,
"valid_targets_min": 1334
},
{
"epoch": 5.709382151029748,
"grad_norm": 0.5331830444355757,
"learning_rate": 4.005872899066232e-06,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26421937346458435,
"step": 7485,
"valid_targets_mean": 3504.0,
"valid_targets_min": 994
},
{
"epoch": 5.713196033562166,
"grad_norm": 0.47084261096423663,
"learning_rate": 3.983063906459672e-06,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.260171502828598,
"step": 7490,
"valid_targets_mean": 4280.6,
"valid_targets_min": 1070
},
{
"epoch": 5.717009916094584,
"grad_norm": 0.5009028299599818,
"learning_rate": 3.960312851937722e-06,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2721886932849884,
"step": 7495,
"valid_targets_mean": 4046.6,
"valid_targets_min": 1336
},
{
"epoch": 5.720823798627002,
"grad_norm": 0.5466785269273442,
"learning_rate": 3.937619817797813e-06,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26342272758483887,
"step": 7500,
"valid_targets_mean": 4143.9,
"valid_targets_min": 859
},
{
"epoch": 5.72463768115942,
"grad_norm": 0.419718247363952,
"learning_rate": 3.9149848861274795e-06,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27253589034080505,
"step": 7505,
"valid_targets_mean": 5215.9,
"valid_targets_min": 1424
},
{
"epoch": 5.728451563691838,
"grad_norm": 0.46579609883184436,
"learning_rate": 3.8924081388040976e-06,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24933433532714844,
"step": 7510,
"valid_targets_mean": 4956.2,
"valid_targets_min": 1100
},
{
"epoch": 5.732265446224257,
"grad_norm": 0.5163794532026748,
"learning_rate": 3.869889657494559e-06,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27208736538887024,
"step": 7515,
"valid_targets_mean": 4663.0,
"valid_targets_min": 1162
},
{
"epoch": 5.7360793287566745,
"grad_norm": 0.48502196089198857,
"learning_rate": 3.847429523655004e-06,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23235277831554413,
"step": 7520,
"valid_targets_mean": 4345.2,
"valid_targets_min": 1173
},
{
"epoch": 5.739893211289092,
"grad_norm": 0.48209817050203563,
"learning_rate": 3.825027818530498e-06,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2796691954135895,
"step": 7525,
"valid_targets_mean": 5048.5,
"valid_targets_min": 467
},
{
"epoch": 5.74370709382151,
"grad_norm": 0.4449831601562535,
"learning_rate": 3.802684623154762e-06,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2815805673599243,
"step": 7530,
"valid_targets_mean": 5262.2,
"valid_targets_min": 1557
},
{
"epoch": 5.747520976353928,
"grad_norm": 0.4479873081666714,
"learning_rate": 3.780400018349872e-06,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27081429958343506,
"step": 7535,
"valid_targets_mean": 5022.8,
"valid_targets_min": 1333
},
{
"epoch": 5.751334858886346,
"grad_norm": 1.3471935076076935,
"learning_rate": 3.7581740847259495e-06,
"loss": 0.3821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4470458924770355,
"step": 7540,
"valid_targets_mean": 882.6,
"valid_targets_min": 583
},
{
"epoch": 5.755148741418765,
"grad_norm": 0.4781128038840103,
"learning_rate": 3.736006902680904e-06,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2608310282230377,
"step": 7545,
"valid_targets_mean": 4537.0,
"valid_targets_min": 843
},
{
"epoch": 5.758962623951183,
"grad_norm": 0.5659433332480197,
"learning_rate": 3.7138985524001057e-06,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31279221177101135,
"step": 7550,
"valid_targets_mean": 4426.8,
"valid_targets_min": 1103
},
{
"epoch": 5.7627765064836005,
"grad_norm": 0.4962767932946681,
"learning_rate": 3.691849113856125e-06,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.219892218708992,
"step": 7555,
"valid_targets_mean": 3565.2,
"valid_targets_min": 1013
},
{
"epoch": 5.766590389016018,
"grad_norm": 0.6270615848107953,
"learning_rate": 3.6698586668084214e-06,
"loss": 0.2848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2851230800151825,
"step": 7560,
"valid_targets_mean": 5459.8,
"valid_targets_min": 1291
},
{
"epoch": 5.770404271548436,
"grad_norm": 0.5020336137990338,
"learning_rate": 3.647927290803075e-06,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2942732572555542,
"step": 7565,
"valid_targets_mean": 4056.2,
"valid_targets_min": 1102
},
{
"epoch": 5.774218154080854,
"grad_norm": 0.47840297911651897,
"learning_rate": 3.6260550651724735e-06,
"loss": 0.2337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23049987852573395,
"step": 7570,
"valid_targets_mean": 4130.0,
"valid_targets_min": 327
},
{
"epoch": 5.778032036613272,
"grad_norm": 0.45812668366800213,
"learning_rate": 3.604242069035051e-06,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24633507430553436,
"step": 7575,
"valid_targets_mean": 4542.7,
"valid_targets_min": 1212
},
{
"epoch": 5.78184591914569,
"grad_norm": 0.4789571096088359,
"learning_rate": 3.582488381294997e-06,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.254001647233963,
"step": 7580,
"valid_targets_mean": 4604.6,
"valid_targets_min": 420
},
{
"epoch": 5.785659801678109,
"grad_norm": 0.4915261483074165,
"learning_rate": 3.560794080641943e-06,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2834867537021637,
"step": 7585,
"valid_targets_mean": 4501.2,
"valid_targets_min": 1410
},
{
"epoch": 5.7894736842105265,
"grad_norm": 0.4302456126659898,
"learning_rate": 3.5391592455507207e-06,
"loss": 0.2451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23200945556163788,
"step": 7590,
"valid_targets_mean": 4676.2,
"valid_targets_min": 577
},
{
"epoch": 5.793287566742944,
"grad_norm": 0.5125700685274149,
"learning_rate": 3.517583954281041e-06,
"loss": 0.2468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26258015632629395,
"step": 7595,
"valid_targets_mean": 3732.4,
"valid_targets_min": 1297
},
{
"epoch": 5.797101449275362,
"grad_norm": 0.4926014789340449,
"learning_rate": 3.4960682848772432e-06,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2648114264011383,
"step": 7600,
"valid_targets_mean": 4162.2,
"valid_targets_min": 929
},
{
"epoch": 5.80091533180778,
"grad_norm": 0.471511291106976,
"learning_rate": 3.4746123151679777e-06,
"loss": 0.2642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23751680552959442,
"step": 7605,
"valid_targets_mean": 4355.8,
"valid_targets_min": 1475
},
{
"epoch": 5.804729214340198,
"grad_norm": 0.47994063760768335,
"learning_rate": 3.4532161227659635e-06,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2726961374282837,
"step": 7610,
"valid_targets_mean": 4271.6,
"valid_targets_min": 877
},
{
"epoch": 5.808543096872616,
"grad_norm": 0.5263789521198493,
"learning_rate": 3.4318797850676643e-06,
"loss": 0.2817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2983848452568054,
"step": 7615,
"valid_targets_mean": 4016.3,
"valid_targets_min": 1584
},
{
"epoch": 5.812356979405035,
"grad_norm": 0.5441262014652823,
"learning_rate": 3.4106033792530503e-06,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29425832629203796,
"step": 7620,
"valid_targets_mean": 3834.4,
"valid_targets_min": 963
},
{
"epoch": 5.816170861937453,
"grad_norm": 0.4594189691390277,
"learning_rate": 3.3893869822852965e-06,
"loss": 0.2393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23714977502822876,
"step": 7625,
"valid_targets_mean": 4394.7,
"valid_targets_min": 971
},
{
"epoch": 5.8199847444698705,
"grad_norm": 0.44797174670219914,
"learning_rate": 3.368230670910495e-06,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24746312201023102,
"step": 7630,
"valid_targets_mean": 5370.3,
"valid_targets_min": 930
},
{
"epoch": 5.823798627002288,
"grad_norm": 0.45332363493811645,
"learning_rate": 3.3471345216574135e-06,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25578317046165466,
"step": 7635,
"valid_targets_mean": 4801.6,
"valid_targets_min": 1460
},
{
"epoch": 5.827612509534706,
"grad_norm": 0.5252092504310898,
"learning_rate": 3.326098610837165e-06,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27364540100097656,
"step": 7640,
"valid_targets_mean": 3530.9,
"valid_targets_min": 516
},
{
"epoch": 5.831426392067124,
"grad_norm": 0.4900065349858666,
"learning_rate": 3.3051230145429834e-06,
"loss": 0.2739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2814614474773407,
"step": 7645,
"valid_targets_mean": 5115.5,
"valid_targets_min": 1055
},
{
"epoch": 5.835240274599542,
"grad_norm": 0.44824989551867944,
"learning_rate": 3.2842078086499307e-06,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24113915860652924,
"step": 7650,
"valid_targets_mean": 4745.6,
"valid_targets_min": 1724
},
{
"epoch": 5.83905415713196,
"grad_norm": 0.4712181525145368,
"learning_rate": 3.2633530688145966e-06,
"loss": 0.2486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2545694410800934,
"step": 7655,
"valid_targets_mean": 4455.9,
"valid_targets_min": 1123
},
{
"epoch": 5.842868039664379,
"grad_norm": 0.4882489300080456,
"learning_rate": 3.24255887047487e-06,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2780630886554718,
"step": 7660,
"valid_targets_mean": 4831.5,
"valid_targets_min": 1362
},
{
"epoch": 5.8466819221967965,
"grad_norm": 0.4102481126349075,
"learning_rate": 3.221825288849625e-06,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23655253648757935,
"step": 7665,
"valid_targets_mean": 5257.2,
"valid_targets_min": 2401
},
{
"epoch": 5.850495804729214,
"grad_norm": 0.4922948313278101,
"learning_rate": 3.201152398938483e-06,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2933632433414459,
"step": 7670,
"valid_targets_mean": 4272.6,
"valid_targets_min": 1201
},
{
"epoch": 5.854309687261632,
"grad_norm": 0.5009285178620376,
"learning_rate": 3.180540275521504e-06,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2608252465724945,
"step": 7675,
"valid_targets_mean": 4210.9,
"valid_targets_min": 1195
},
{
"epoch": 5.85812356979405,
"grad_norm": 0.4788458917234944,
"learning_rate": 3.1599889931589644e-06,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24401216208934784,
"step": 7680,
"valid_targets_mean": 4195.2,
"valid_targets_min": 908
},
{
"epoch": 5.861937452326468,
"grad_norm": 0.48355312631125696,
"learning_rate": 3.1394986261910352e-06,
"loss": 0.2874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2997702658176422,
"step": 7685,
"valid_targets_mean": 4433.9,
"valid_targets_min": 861
},
{
"epoch": 5.865751334858887,
"grad_norm": 0.48194084992498054,
"learning_rate": 3.1190692487375495e-06,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27790045738220215,
"step": 7690,
"valid_targets_mean": 4411.3,
"valid_targets_min": 1015
},
{
"epoch": 5.869565217391305,
"grad_norm": 0.4792526887514992,
"learning_rate": 3.0987009346977314e-06,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2566789984703064,
"step": 7695,
"valid_targets_mean": 4372.5,
"valid_targets_min": 730
},
{
"epoch": 5.8733790999237225,
"grad_norm": 0.5247160658839248,
"learning_rate": 3.078393757749898e-06,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2623863220214844,
"step": 7700,
"valid_targets_mean": 3699.5,
"valid_targets_min": 1064
},
{
"epoch": 5.87719298245614,
"grad_norm": 1.31309012160065,
"learning_rate": 3.0581477913512402e-06,
"loss": 0.4075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4631132185459137,
"step": 7705,
"valid_targets_mean": 924.8,
"valid_targets_min": 595
},
{
"epoch": 5.881006864988558,
"grad_norm": 0.5058652384548464,
"learning_rate": 3.0379631087375094e-06,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2527218163013458,
"step": 7710,
"valid_targets_mean": 3840.2,
"valid_targets_min": 1092
},
{
"epoch": 5.884820747520976,
"grad_norm": 0.48742105702963867,
"learning_rate": 3.0178397829227935e-06,
"loss": 0.2533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.266996294260025,
"step": 7715,
"valid_targets_mean": 4231.3,
"valid_targets_min": 427
},
{
"epoch": 5.888634630053394,
"grad_norm": 0.4583551693813073,
"learning_rate": 2.997777886699216e-06,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21432173252105713,
"step": 7720,
"valid_targets_mean": 4182.4,
"valid_targets_min": 1484
},
{
"epoch": 5.892448512585812,
"grad_norm": 0.502015689504552,
"learning_rate": 2.9777774926367153e-06,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22121445834636688,
"step": 7725,
"valid_targets_mean": 3529.1,
"valid_targets_min": 437
},
{
"epoch": 5.896262395118231,
"grad_norm": 0.45289837614009193,
"learning_rate": 2.957838673082729e-06,
"loss": 0.2777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.266684889793396,
"step": 7730,
"valid_targets_mean": 4576.7,
"valid_targets_min": 530
},
{
"epoch": 5.900076277650649,
"grad_norm": 0.48492694694900196,
"learning_rate": 2.9379615001619834e-06,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2345353364944458,
"step": 7735,
"valid_targets_mean": 3823.9,
"valid_targets_min": 1160
},
{
"epoch": 5.9038901601830664,
"grad_norm": 0.48980103900349786,
"learning_rate": 2.918146045776209e-06,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30960848927497864,
"step": 7740,
"valid_targets_mean": 4416.5,
"valid_targets_min": 705
},
{
"epoch": 5.907704042715484,
"grad_norm": 0.43775365194750415,
"learning_rate": 2.8983923816038628e-06,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3002133071422577,
"step": 7745,
"valid_targets_mean": 6101.7,
"valid_targets_min": 894
},
{
"epoch": 5.911517925247902,
"grad_norm": 0.4870360310259264,
"learning_rate": 2.8787005790999157e-06,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2697948217391968,
"step": 7750,
"valid_targets_mean": 4514.3,
"valid_targets_min": 1035
},
{
"epoch": 5.91533180778032,
"grad_norm": 0.4816571987450125,
"learning_rate": 2.859070709495535e-06,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2682059705257416,
"step": 7755,
"valid_targets_mean": 4110.0,
"valid_targets_min": 442
},
{
"epoch": 5.919145690312739,
"grad_norm": 0.4432390917784789,
"learning_rate": 2.83950284379789e-06,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29021620750427246,
"step": 7760,
"valid_targets_mean": 5378.8,
"valid_targets_min": 1510
},
{
"epoch": 5.922959572845157,
"grad_norm": 0.4890666324358443,
"learning_rate": 2.819997052789838e-06,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2582494914531708,
"step": 7765,
"valid_targets_mean": 4316.7,
"valid_targets_min": 434
},
{
"epoch": 5.926773455377575,
"grad_norm": 0.5424078222177492,
"learning_rate": 2.8005534070297092e-06,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644309997558594,
"step": 7770,
"valid_targets_mean": 4150.8,
"valid_targets_min": 1320
},
{
"epoch": 5.9305873379099925,
"grad_norm": 0.5196203991335387,
"learning_rate": 2.7811719768510205e-06,
"loss": 0.2662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2673504054546356,
"step": 7775,
"valid_targets_mean": 3580.5,
"valid_targets_min": 952
},
{
"epoch": 5.93440122044241,
"grad_norm": 0.4561509143165148,
"learning_rate": 2.761852832362255e-06,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27049699425697327,
"step": 7780,
"valid_targets_mean": 5493.5,
"valid_targets_min": 1451
},
{
"epoch": 5.938215102974828,
"grad_norm": 0.4723195240543183,
"learning_rate": 2.7425960434465794e-06,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2836945950984955,
"step": 7785,
"valid_targets_mean": 4640.3,
"valid_targets_min": 1688
},
{
"epoch": 5.942028985507246,
"grad_norm": 0.4902425169332125,
"learning_rate": 2.7234016797615947e-06,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24308143556118011,
"step": 7790,
"valid_targets_mean": 4298.5,
"valid_targets_min": 1232
},
{
"epoch": 5.945842868039664,
"grad_norm": 0.5029709069193514,
"learning_rate": 2.704269810739111e-06,
"loss": 0.2727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2596876919269562,
"step": 7795,
"valid_targets_mean": 4338.5,
"valid_targets_min": 1302
},
{
"epoch": 5.949656750572083,
"grad_norm": 0.482901901062868,
"learning_rate": 2.6852005055848506e-06,
"loss": 0.2475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2369847297668457,
"step": 7800,
"valid_targets_mean": 4154.8,
"valid_targets_min": 268
},
{
"epoch": 5.953470633104501,
"grad_norm": 0.45917913875581223,
"learning_rate": 2.6661938332782477e-06,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22529812157154083,
"step": 7805,
"valid_targets_mean": 4389.7,
"valid_targets_min": 1339
},
{
"epoch": 5.9572845156369185,
"grad_norm": 0.446736608750938,
"learning_rate": 2.6472498625721543e-06,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29567384719848633,
"step": 7810,
"valid_targets_mean": 4869.5,
"valid_targets_min": 504
},
{
"epoch": 5.961098398169336,
"grad_norm": 0.4351896685706992,
"learning_rate": 2.628368661992633e-06,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605706751346588,
"step": 7815,
"valid_targets_mean": 5280.7,
"valid_targets_min": 1398
},
{
"epoch": 5.964912280701754,
"grad_norm": 0.5221413256363302,
"learning_rate": 2.6095502998386636e-06,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2452189177274704,
"step": 7820,
"valid_targets_mean": 3603.2,
"valid_targets_min": 885
},
{
"epoch": 5.968726163234172,
"grad_norm": 0.4864253450865069,
"learning_rate": 2.5907948441819386e-06,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2926352620124817,
"step": 7825,
"valid_targets_mean": 4895.9,
"valid_targets_min": 1220
},
{
"epoch": 5.97254004576659,
"grad_norm": 0.47427799794774056,
"learning_rate": 2.5721023628665975e-06,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26650452613830566,
"step": 7830,
"valid_targets_mean": 5234.3,
"valid_targets_min": 1270
},
{
"epoch": 5.976353928299009,
"grad_norm": 0.49233848311869016,
"learning_rate": 2.5534729235089685e-06,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2766297459602356,
"step": 7835,
"valid_targets_mean": 4930.2,
"valid_targets_min": 1275
},
{
"epoch": 5.980167810831427,
"grad_norm": 0.47527502992187665,
"learning_rate": 2.5349065934973593e-06,
"loss": 0.265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2880236804485321,
"step": 7840,
"valid_targets_mean": 4734.1,
"valid_targets_min": 949
},
{
"epoch": 5.983981693363845,
"grad_norm": 0.559391570426309,
"learning_rate": 2.51640343999177e-06,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2612583339214325,
"step": 7845,
"valid_targets_mean": 3851.5,
"valid_targets_min": 1105
},
{
"epoch": 5.987795575896262,
"grad_norm": 0.490844670179712,
"learning_rate": 2.4979635299236926e-06,
"loss": 0.2617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24493573606014252,
"step": 7850,
"valid_targets_mean": 4531.8,
"valid_targets_min": 1130
},
{
"epoch": 5.99160945842868,
"grad_norm": 0.45615276740640753,
"learning_rate": 2.47958692999583e-06,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24681413173675537,
"step": 7855,
"valid_targets_mean": 4569.3,
"valid_targets_min": 1345
},
{
"epoch": 5.995423340961098,
"grad_norm": 0.46989711303161386,
"learning_rate": 2.461273706681888e-06,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30878710746765137,
"step": 7860,
"valid_targets_mean": 4841.8,
"valid_targets_min": 1035
},
{
"epoch": 5.999237223493516,
"grad_norm": 1.3501461018957615,
"learning_rate": 2.443023926226309e-06,
"loss": 0.4129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49166861176490784,
"step": 7865,
"valid_targets_mean": 893.5,
"valid_targets_min": 437
},
{
"epoch": 6.003051106025935,
"grad_norm": 0.48062968179889437,
"learning_rate": 2.42483765464405e-06,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2480214685201645,
"step": 7870,
"valid_targets_mean": 5001.8,
"valid_targets_min": 1201
},
{
"epoch": 6.006864988558353,
"grad_norm": 0.4925864276970704,
"learning_rate": 2.406714957720342e-06,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2455272078514099,
"step": 7875,
"valid_targets_mean": 3972.8,
"valid_targets_min": 1183
},
{
"epoch": 6.010678871090771,
"grad_norm": 0.45788706813347363,
"learning_rate": 2.3886559010104326e-06,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22061456739902496,
"step": 7880,
"valid_targets_mean": 4328.2,
"valid_targets_min": 1027
},
{
"epoch": 6.0144927536231885,
"grad_norm": 0.47804510565235997,
"learning_rate": 2.3706605498393787e-06,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.278346449136734,
"step": 7885,
"valid_targets_mean": 3989.0,
"valid_targets_min": 1000
},
{
"epoch": 6.018306636155606,
"grad_norm": 0.5373527975549953,
"learning_rate": 2.352728969301783e-06,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2867368161678314,
"step": 7890,
"valid_targets_mean": 4721.1,
"valid_targets_min": 1509
},
{
"epoch": 6.022120518688024,
"grad_norm": 0.47067460411820394,
"learning_rate": 2.334861224261582e-06,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30547037720680237,
"step": 7895,
"valid_targets_mean": 4757.3,
"valid_targets_min": 579
},
{
"epoch": 6.025934401220442,
"grad_norm": 0.5499976280698272,
"learning_rate": 2.317057379351786e-06,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2520096004009247,
"step": 7900,
"valid_targets_mean": 3518.1,
"valid_targets_min": 703
},
{
"epoch": 6.02974828375286,
"grad_norm": 0.5062986771267566,
"learning_rate": 2.2993174989742762e-06,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28065720200538635,
"step": 7905,
"valid_targets_mean": 4128.1,
"valid_targets_min": 1327
},
{
"epoch": 6.033562166285279,
"grad_norm": 0.4308141740962017,
"learning_rate": 2.2816416472995374e-06,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22161316871643066,
"step": 7910,
"valid_targets_mean": 4659.9,
"valid_targets_min": 1388
},
{
"epoch": 6.037376048817697,
"grad_norm": 0.4557597674304979,
"learning_rate": 2.264029888266457e-06,
"loss": 0.2473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27463290095329285,
"step": 7915,
"valid_targets_mean": 4919.1,
"valid_targets_min": 825
},
{
"epoch": 6.0411899313501145,
"grad_norm": 0.47269435901277407,
"learning_rate": 2.246482285582077e-06,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2803293466567993,
"step": 7920,
"valid_targets_mean": 4718.7,
"valid_targets_min": 1230
},
{
"epoch": 6.045003813882532,
"grad_norm": 0.5042126557922357,
"learning_rate": 2.2289989027213555e-06,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23255133628845215,
"step": 7925,
"valid_targets_mean": 3776.7,
"valid_targets_min": 921
},
{
"epoch": 6.04881769641495,
"grad_norm": 0.46979730781076023,
"learning_rate": 2.2115798029269686e-06,
"loss": 0.2559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23931367695331573,
"step": 7930,
"valid_targets_mean": 5090.0,
"valid_targets_min": 947
},
{
"epoch": 6.052631578947368,
"grad_norm": 0.48482595112718446,
"learning_rate": 2.19422504920904e-06,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2659645974636078,
"step": 7935,
"valid_targets_mean": 4528.5,
"valid_targets_min": 711
},
{
"epoch": 6.056445461479786,
"grad_norm": 0.48749706923409686,
"learning_rate": 2.1769347043449486e-06,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2688192129135132,
"step": 7940,
"valid_targets_mean": 4277.3,
"valid_targets_min": 917
},
{
"epoch": 6.060259344012205,
"grad_norm": 0.4644017044390465,
"learning_rate": 2.159708830879079e-06,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3060270845890045,
"step": 7945,
"valid_targets_mean": 4950.3,
"valid_targets_min": 1222
},
{
"epoch": 6.064073226544623,
"grad_norm": 0.4906142087642577,
"learning_rate": 2.142547491122613e-06,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2784336507320404,
"step": 7950,
"valid_targets_mean": 4383.7,
"valid_targets_min": 531
},
{
"epoch": 6.0678871090770405,
"grad_norm": 0.5334373559306215,
"learning_rate": 2.1254507471532837e-06,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2708498239517212,
"step": 7955,
"valid_targets_mean": 3776.0,
"valid_targets_min": 1426
},
{
"epoch": 6.071700991609458,
"grad_norm": 0.4386048831830409,
"learning_rate": 2.108418660815161e-06,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2562674582004547,
"step": 7960,
"valid_targets_mean": 5180.0,
"valid_targets_min": 1199
},
{
"epoch": 6.075514874141876,
"grad_norm": 0.4506492034727124,
"learning_rate": 2.091451293718445e-06,
"loss": 0.2595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26452645659446716,
"step": 7965,
"valid_targets_mean": 5052.3,
"valid_targets_min": 1547
},
{
"epoch": 6.079328756674294,
"grad_norm": 0.510818194605105,
"learning_rate": 2.0745487072392055e-06,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605459988117218,
"step": 7970,
"valid_targets_mean": 4058.3,
"valid_targets_min": 1098
},
{
"epoch": 6.083142639206712,
"grad_norm": 0.5633091083246478,
"learning_rate": 2.0577109625191994e-06,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31739693880081177,
"step": 7975,
"valid_targets_mean": 4121.5,
"valid_targets_min": 1049
},
{
"epoch": 6.086956521739131,
"grad_norm": 0.4949607184258331,
"learning_rate": 2.0409381204656166e-06,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2758539617061615,
"step": 7980,
"valid_targets_mean": 4030.7,
"valid_targets_min": 1407
},
{
"epoch": 6.090770404271549,
"grad_norm": 0.4933453751194869,
"learning_rate": 2.0242302417508887e-06,
"loss": 0.2726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3091985881328583,
"step": 7985,
"valid_targets_mean": 4677.6,
"valid_targets_min": 1302
},
{
"epoch": 6.094584286803967,
"grad_norm": 0.5208120342594886,
"learning_rate": 2.0075873868124374e-06,
"loss": 0.2658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2794772684574127,
"step": 7990,
"valid_targets_mean": 3504.0,
"valid_targets_min": 1117
},
{
"epoch": 6.0983981693363845,
"grad_norm": 0.47175364867379893,
"learning_rate": 1.991009615852493e-06,
"loss": 0.241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2372446060180664,
"step": 7995,
"valid_targets_mean": 4242.5,
"valid_targets_min": 1444
},
{
"epoch": 6.102212051868802,
"grad_norm": 0.47635870334783337,
"learning_rate": 1.9744969888378507e-06,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27210959792137146,
"step": 8000,
"valid_targets_mean": 3909.9,
"valid_targets_min": 725
},
{
"epoch": 6.10602593440122,
"grad_norm": 0.4897149992424955,
"learning_rate": 1.958049565499651e-06,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2656501829624176,
"step": 8005,
"valid_targets_mean": 3961.4,
"valid_targets_min": 1059
},
{
"epoch": 6.109839816933638,
"grad_norm": 0.49644054743886196,
"learning_rate": 1.9416674053331874e-06,
"loss": 0.2759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2539803385734558,
"step": 8010,
"valid_targets_mean": 4016.4,
"valid_targets_min": 981
},
{
"epoch": 6.113653699466057,
"grad_norm": 0.45827090956821354,
"learning_rate": 1.9253505675976637e-06,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2474987506866455,
"step": 8015,
"valid_targets_mean": 4490.6,
"valid_targets_min": 1025
},
{
"epoch": 6.117467581998475,
"grad_norm": 0.532130189641217,
"learning_rate": 1.9090991113160063e-06,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2694808542728424,
"step": 8020,
"valid_targets_mean": 3972.2,
"valid_targets_min": 419
},
{
"epoch": 6.121281464530893,
"grad_norm": 0.48835300034807266,
"learning_rate": 1.8929130952746221e-06,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2953863739967346,
"step": 8025,
"valid_targets_mean": 4520.6,
"valid_targets_min": 972
},
{
"epoch": 6.1250953470633105,
"grad_norm": 0.666454281494576,
"learning_rate": 1.8767925780232165e-06,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2826656997203827,
"step": 8030,
"valid_targets_mean": 2480.5,
"valid_targets_min": 586
},
{
"epoch": 6.128909229595728,
"grad_norm": 0.44612454771434085,
"learning_rate": 1.8607376178745507e-06,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26308444142341614,
"step": 8035,
"valid_targets_mean": 4591.0,
"valid_targets_min": 1422
},
{
"epoch": 6.132723112128146,
"grad_norm": 0.4826682472062758,
"learning_rate": 1.8447482729042575e-06,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25889599323272705,
"step": 8040,
"valid_targets_mean": 4414.1,
"valid_targets_min": 802
},
{
"epoch": 6.136536994660564,
"grad_norm": 0.5109485985510919,
"learning_rate": 1.8288246009506205e-06,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3065207004547119,
"step": 8045,
"valid_targets_mean": 4242.8,
"valid_targets_min": 1180
},
{
"epoch": 6.140350877192983,
"grad_norm": 0.4985109163800362,
"learning_rate": 1.8129666596143525e-06,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2521675229072571,
"step": 8050,
"valid_targets_mean": 4853.1,
"valid_targets_min": 1206
},
{
"epoch": 6.144164759725401,
"grad_norm": 0.4901306618532278,
"learning_rate": 1.7971745062584124e-06,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22057747840881348,
"step": 8055,
"valid_targets_mean": 3941.9,
"valid_targets_min": 771
},
{
"epoch": 6.147978642257819,
"grad_norm": 0.466196185868008,
"learning_rate": 1.7814481980077715e-06,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25427624583244324,
"step": 8060,
"valid_targets_mean": 4745.8,
"valid_targets_min": 1322
},
{
"epoch": 6.1517925247902365,
"grad_norm": 0.589441832405084,
"learning_rate": 1.7657877917492317e-06,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23444731533527374,
"step": 8065,
"valid_targets_mean": 2909.0,
"valid_targets_min": 957
},
{
"epoch": 6.155606407322654,
"grad_norm": 0.47368781222899703,
"learning_rate": 1.750193344131197e-06,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25396108627319336,
"step": 8070,
"valid_targets_mean": 4479.5,
"valid_targets_min": 1510
},
{
"epoch": 6.159420289855072,
"grad_norm": 0.4450780056952024,
"learning_rate": 1.734664911563486e-06,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27313801646232605,
"step": 8075,
"valid_targets_mean": 4954.8,
"valid_targets_min": 1624
},
{
"epoch": 6.16323417238749,
"grad_norm": 0.48910138411977444,
"learning_rate": 1.7192025502171228e-06,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22142617404460907,
"step": 8080,
"valid_targets_mean": 4333.7,
"valid_targets_min": 861
},
{
"epoch": 6.167048054919908,
"grad_norm": 0.48170174354701956,
"learning_rate": 1.7038063160241192e-06,
"loss": 0.258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2735546827316284,
"step": 8085,
"valid_targets_mean": 4614.9,
"valid_targets_min": 1063
},
{
"epoch": 6.170861937452327,
"grad_norm": 0.4854645935841226,
"learning_rate": 1.6884762646773033e-06,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21456031501293182,
"step": 8090,
"valid_targets_mean": 3828.2,
"valid_targets_min": 1029
},
{
"epoch": 6.174675819984745,
"grad_norm": 0.5193233563509866,
"learning_rate": 1.673212451630084e-06,
"loss": 0.2487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23842072486877441,
"step": 8095,
"valid_targets_mean": 4357.5,
"valid_targets_min": 1403
},
{
"epoch": 6.178489702517163,
"grad_norm": 0.46674004165837635,
"learning_rate": 1.658014932096279e-06,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2715775668621063,
"step": 8100,
"valid_targets_mean": 4991.6,
"valid_targets_min": 1196
},
{
"epoch": 6.18230358504958,
"grad_norm": 0.4395211421948986,
"learning_rate": 1.6428837610498871e-06,
"loss": 0.2543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22720418870449066,
"step": 8105,
"valid_targets_mean": 4861.5,
"valid_targets_min": 1284
},
{
"epoch": 6.186117467581998,
"grad_norm": 0.4452513509591422,
"learning_rate": 1.6278189932249254e-06,
"loss": 0.2571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2689577043056488,
"step": 8110,
"valid_targets_mean": 5120.7,
"valid_targets_min": 1014
},
{
"epoch": 6.189931350114416,
"grad_norm": 0.46574167515943166,
"learning_rate": 1.6128206831151882e-06,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2244655340909958,
"step": 8115,
"valid_targets_mean": 5011.2,
"valid_targets_min": 447
},
{
"epoch": 6.193745232646834,
"grad_norm": 0.4524835605573105,
"learning_rate": 1.5978888849740859e-06,
"loss": 0.2717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3081461489200592,
"step": 8120,
"valid_targets_mean": 5331.9,
"valid_targets_min": 780
},
{
"epoch": 6.197559115179253,
"grad_norm": 0.4590513523291447,
"learning_rate": 1.5830236528144393e-06,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2569229304790497,
"step": 8125,
"valid_targets_mean": 4720.4,
"valid_targets_min": 1129
},
{
"epoch": 6.201372997711671,
"grad_norm": 0.49349920923341595,
"learning_rate": 1.5682250404082644e-06,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.239435076713562,
"step": 8130,
"valid_targets_mean": 4415.0,
"valid_targets_min": 1096
},
{
"epoch": 6.205186880244089,
"grad_norm": 0.4835711092547128,
"learning_rate": 1.5534931012866073e-06,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28328731656074524,
"step": 8135,
"valid_targets_mean": 5174.2,
"valid_targets_min": 728
},
{
"epoch": 6.2090007627765065,
"grad_norm": 0.469441730252239,
"learning_rate": 1.5388278887393248e-06,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25443562865257263,
"step": 8140,
"valid_targets_mean": 4408.7,
"valid_targets_min": 1133
},
{
"epoch": 6.212814645308924,
"grad_norm": 0.5158535576190626,
"learning_rate": 1.5242294558149185e-06,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2312001734972,
"step": 8145,
"valid_targets_mean": 3657.9,
"valid_targets_min": 437
},
{
"epoch": 6.216628527841342,
"grad_norm": 0.553127176309931,
"learning_rate": 1.5096978553203113e-06,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30233147740364075,
"step": 8150,
"valid_targets_mean": 3667.6,
"valid_targets_min": 924
},
{
"epoch": 6.22044241037376,
"grad_norm": 0.48795105972995456,
"learning_rate": 1.4952331398206887e-06,
"loss": 0.2551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20166908204555511,
"step": 8155,
"valid_targets_mean": 3893.6,
"valid_targets_min": 259
},
{
"epoch": 6.224256292906179,
"grad_norm": 0.4551850427448832,
"learning_rate": 1.480835361639279e-06,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29251715540885925,
"step": 8160,
"valid_targets_mean": 5185.8,
"valid_targets_min": 877
},
{
"epoch": 6.228070175438597,
"grad_norm": 0.4373875864246496,
"learning_rate": 1.4665045728571882e-06,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2827031910419464,
"step": 8165,
"valid_targets_mean": 4935.5,
"valid_targets_min": 1328
},
{
"epoch": 6.231884057971015,
"grad_norm": 0.4731594753863616,
"learning_rate": 1.4522408253132025e-06,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2341814786195755,
"step": 8170,
"valid_targets_mean": 4701.2,
"valid_targets_min": 1053
},
{
"epoch": 6.2356979405034325,
"grad_norm": 0.5056521083824401,
"learning_rate": 1.4380441706035853e-06,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2901335060596466,
"step": 8175,
"valid_targets_mean": 4571.2,
"valid_targets_min": 1179
},
{
"epoch": 6.23951182303585,
"grad_norm": 0.4462897818037207,
"learning_rate": 1.4239146600819242e-06,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3010201156139374,
"step": 8180,
"valid_targets_mean": 5367.0,
"valid_targets_min": 1576
},
{
"epoch": 6.243325705568268,
"grad_norm": 0.4739465545428769,
"learning_rate": 1.4098523448589085e-06,
"loss": 0.2672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2658689618110657,
"step": 8185,
"valid_targets_mean": 4513.1,
"valid_targets_min": 1114
},
{
"epoch": 6.247139588100686,
"grad_norm": 0.5728493918682379,
"learning_rate": 1.395857275802177e-06,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27031782269477844,
"step": 8190,
"valid_targets_mean": 3563.4,
"valid_targets_min": 1235
},
{
"epoch": 6.250953470633105,
"grad_norm": 1.3211397960464706,
"learning_rate": 1.3819295035361058e-06,
"loss": 0.4452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4577854573726654,
"step": 8195,
"valid_targets_mean": 904.5,
"valid_targets_min": 535
},
{
"epoch": 6.254767353165523,
"grad_norm": 0.45784081080185146,
"learning_rate": 1.3680690784416518e-06,
"loss": 0.2848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2961617410182953,
"step": 8200,
"valid_targets_mean": 5407.8,
"valid_targets_min": 967
},
{
"epoch": 6.258581235697941,
"grad_norm": 0.46998051084917214,
"learning_rate": 1.3542760506561425e-06,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2554444372653961,
"step": 8205,
"valid_targets_mean": 4629.0,
"valid_targets_min": 942
},
{
"epoch": 6.2623951182303585,
"grad_norm": 0.5663180562707967,
"learning_rate": 1.3405504700731187e-06,
"loss": 0.2623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27484387159347534,
"step": 8210,
"valid_targets_mean": 3721.8,
"valid_targets_min": 1239
},
{
"epoch": 6.266209000762776,
"grad_norm": 0.5004847910957235,
"learning_rate": 1.3268923863421446e-06,
"loss": 0.2693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23197054862976074,
"step": 8215,
"valid_targets_mean": 3964.7,
"valid_targets_min": 1498
},
{
"epoch": 6.270022883295194,
"grad_norm": 0.5283419533962973,
"learning_rate": 1.3133018488686178e-06,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2701933979988098,
"step": 8220,
"valid_targets_mean": 3617.1,
"valid_targets_min": 1119
},
{
"epoch": 6.273836765827612,
"grad_norm": 0.42300879977149064,
"learning_rate": 1.2997789068136179e-06,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26573577523231506,
"step": 8225,
"valid_targets_mean": 5194.5,
"valid_targets_min": 506
},
{
"epoch": 6.27765064836003,
"grad_norm": 0.49915292987260135,
"learning_rate": 1.2863236090936914e-06,
"loss": 0.2468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2291276901960373,
"step": 8230,
"valid_targets_mean": 3968.0,
"valid_targets_min": 1443
},
{
"epoch": 6.281464530892449,
"grad_norm": 0.4814365648176594,
"learning_rate": 1.2729360043807115e-06,
"loss": 0.266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2721117436885834,
"step": 8235,
"valid_targets_mean": 4163.8,
"valid_targets_min": 1016
},
{
"epoch": 6.285278413424867,
"grad_norm": 0.4584146356424767,
"learning_rate": 1.2596161411016761e-06,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2678042948246002,
"step": 8240,
"valid_targets_mean": 4794.0,
"valid_targets_min": 1423
},
{
"epoch": 6.289092295957285,
"grad_norm": 0.5086223883422862,
"learning_rate": 1.2463640674385458e-06,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28021755814552307,
"step": 8245,
"valid_targets_mean": 4818.8,
"valid_targets_min": 1828
},
{
"epoch": 6.2929061784897025,
"grad_norm": 0.49136585702620744,
"learning_rate": 1.233179831328062e-06,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23660731315612793,
"step": 8250,
"valid_targets_mean": 3634.5,
"valid_targets_min": 1127
},
{
"epoch": 6.29672006102212,
"grad_norm": 0.53884264245829,
"learning_rate": 1.2200634804615818e-06,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22205261886119843,
"step": 8255,
"valid_targets_mean": 3687.9,
"valid_targets_min": 436
},
{
"epoch": 6.300533943554538,
"grad_norm": 0.48947114458130897,
"learning_rate": 1.207015062284902e-06,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2426479309797287,
"step": 8260,
"valid_targets_mean": 3859.2,
"valid_targets_min": 1237
},
{
"epoch": 6.304347826086957,
"grad_norm": 0.4567633292464014,
"learning_rate": 1.1940346239980816e-06,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27313122153282166,
"step": 8265,
"valid_targets_mean": 4842.5,
"valid_targets_min": 1110
},
{
"epoch": 6.308161708619375,
"grad_norm": 0.4995871522429241,
"learning_rate": 1.1811222125552768e-06,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2652623951435089,
"step": 8270,
"valid_targets_mean": 3800.2,
"valid_targets_min": 637
},
{
"epoch": 6.311975591151793,
"grad_norm": 0.5468633135839358,
"learning_rate": 1.1682778746645652e-06,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27540352940559387,
"step": 8275,
"valid_targets_mean": 4041.3,
"valid_targets_min": 931
},
{
"epoch": 6.315789473684211,
"grad_norm": 0.5313235594410799,
"learning_rate": 1.1555016567877985e-06,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2507777214050293,
"step": 8280,
"valid_targets_mean": 3945.6,
"valid_targets_min": 872
},
{
"epoch": 6.3196033562166285,
"grad_norm": 0.630105166821167,
"learning_rate": 1.1427936051403977e-06,
"loss": 0.2511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21576042473316193,
"step": 8285,
"valid_targets_mean": 2889.1,
"valid_targets_min": 734
},
{
"epoch": 6.323417238749046,
"grad_norm": 0.4653648737455474,
"learning_rate": 1.1301537656912175e-06,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28202584385871887,
"step": 8290,
"valid_targets_mean": 4816.4,
"valid_targets_min": 1084
},
{
"epoch": 6.327231121281464,
"grad_norm": 0.5166525372254579,
"learning_rate": 1.1175821841623712e-06,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2229657620191574,
"step": 8295,
"valid_targets_mean": 3587.4,
"valid_targets_min": 1143
},
{
"epoch": 6.331045003813882,
"grad_norm": 0.4833110267231946,
"learning_rate": 1.1050789060290534e-06,
"loss": 0.2642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2544369101524353,
"step": 8300,
"valid_targets_mean": 4295.7,
"valid_targets_min": 1226
},
{
"epoch": 6.334858886346301,
"grad_norm": 0.5346116958118867,
"learning_rate": 1.0926439765193898e-06,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22066330909729004,
"step": 8305,
"valid_targets_mean": 3234.5,
"valid_targets_min": 279
},
{
"epoch": 6.338672768878719,
"grad_norm": 0.5235801033937233,
"learning_rate": 1.080277440614268e-06,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30774369835853577,
"step": 8310,
"valid_targets_mean": 4542.8,
"valid_targets_min": 1109
},
{
"epoch": 6.342486651411137,
"grad_norm": 0.48340978591910344,
"learning_rate": 1.0679793430471763e-06,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2984248399734497,
"step": 8315,
"valid_targets_mean": 4806.4,
"valid_targets_min": 837
},
{
"epoch": 6.3463005339435545,
"grad_norm": 0.4839962726354207,
"learning_rate": 1.055749728304034e-06,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24378865957260132,
"step": 8320,
"valid_targets_mean": 4818.2,
"valid_targets_min": 1553
},
{
"epoch": 6.350114416475972,
"grad_norm": 0.48547846148092877,
"learning_rate": 1.0435886406230522e-06,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29921552538871765,
"step": 8325,
"valid_targets_mean": 4799.2,
"valid_targets_min": 720
},
{
"epoch": 6.35392829900839,
"grad_norm": 0.4826226506202875,
"learning_rate": 1.031496123994542e-06,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2462555170059204,
"step": 8330,
"valid_targets_mean": 5017.3,
"valid_targets_min": 1309
},
{
"epoch": 6.357742181540808,
"grad_norm": 0.5422536322203456,
"learning_rate": 1.0194722221607823e-06,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23788587749004364,
"step": 8335,
"valid_targets_mean": 4561.3,
"valid_targets_min": 1150
},
{
"epoch": 6.361556064073227,
"grad_norm": 0.4923820461404623,
"learning_rate": 1.0075169786158544e-06,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28204765915870667,
"step": 8340,
"valid_targets_mean": 4894.0,
"valid_targets_min": 773
},
{
"epoch": 6.365369946605645,
"grad_norm": 0.5055193746390563,
"learning_rate": 9.956304366054682e-07,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22904770076274872,
"step": 8345,
"valid_targets_mean": 4334.6,
"valid_targets_min": 1197
},
{
"epoch": 6.369183829138063,
"grad_norm": 0.4496958094342579,
"learning_rate": 9.838126391268377e-07,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.210269495844841,
"step": 8350,
"valid_targets_mean": 4551.9,
"valid_targets_min": 900
},
{
"epoch": 6.372997711670481,
"grad_norm": 0.42807004915669006,
"learning_rate": 9.720636289284878e-07,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2618262469768524,
"step": 8355,
"valid_targets_mean": 5323.6,
"valid_targets_min": 942
},
{
"epoch": 6.3768115942028984,
"grad_norm": 0.5431535643885081,
"learning_rate": 9.603834485101381e-07,
"loss": 0.3526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27988871932029724,
"step": 8360,
"valid_targets_mean": 3949.1,
"valid_targets_min": 1206
},
{
"epoch": 6.380625476735316,
"grad_norm": 0.5151995528629127,
"learning_rate": 9.487721401225137e-07,
"loss": 0.2761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27052268385887146,
"step": 8365,
"valid_targets_mean": 3915.1,
"valid_targets_min": 977
},
{
"epoch": 6.384439359267734,
"grad_norm": 0.4529826695504075,
"learning_rate": 9.372297457672231e-07,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.260204017162323,
"step": 8370,
"valid_targets_mean": 5037.4,
"valid_targets_min": 268
},
{
"epoch": 6.388253241800153,
"grad_norm": 0.476253361507551,
"learning_rate": 9.257563071965792e-07,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2602754533290863,
"step": 8375,
"valid_targets_mean": 4367.5,
"valid_targets_min": 1371
},
{
"epoch": 6.392067124332571,
"grad_norm": 0.4609825503411047,
"learning_rate": 9.143518659134676e-07,
"loss": 0.2583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2888159453868866,
"step": 8380,
"valid_targets_mean": 4771.2,
"valid_targets_min": 1556
},
{
"epoch": 6.395881006864989,
"grad_norm": 0.4615228842972912,
"learning_rate": 9.030164631711957e-07,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2512037456035614,
"step": 8385,
"valid_targets_mean": 4216.5,
"valid_targets_min": 1181
},
{
"epoch": 6.399694889397407,
"grad_norm": 0.4783617043494897,
"learning_rate": 8.917501399733219e-07,
"loss": 0.2624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31296250224113464,
"step": 8390,
"valid_targets_mean": 5034.9,
"valid_targets_min": 1488
},
{
"epoch": 6.4035087719298245,
"grad_norm": 0.4554766870515671,
"learning_rate": 8.805529370735378e-07,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24182575941085815,
"step": 8395,
"valid_targets_mean": 4342.8,
"valid_targets_min": 1501
},
{
"epoch": 6.407322654462242,
"grad_norm": 0.49378415215503346,
"learning_rate": 8.694248949754991e-07,
"loss": 0.2506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.227997824549675,
"step": 8400,
"valid_targets_mean": 3916.5,
"valid_targets_min": 1133
},
{
"epoch": 6.41113653699466,
"grad_norm": 0.5026431344870141,
"learning_rate": 8.583660539326911e-07,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28937292098999023,
"step": 8405,
"valid_targets_mean": 4306.0,
"valid_targets_min": 1533
},
{
"epoch": 6.414950419527079,
"grad_norm": 0.4789425873369109,
"learning_rate": 8.473764539482654e-07,
"loss": 0.2613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24315117299556732,
"step": 8410,
"valid_targets_mean": 4329.9,
"valid_targets_min": 1148
},
{
"epoch": 6.418764302059497,
"grad_norm": 0.44425281965231356,
"learning_rate": 8.364561347749279e-07,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2703532874584198,
"step": 8415,
"valid_targets_mean": 5093.1,
"valid_targets_min": 360
},
{
"epoch": 6.422578184591915,
"grad_norm": 0.4504345015374403,
"learning_rate": 8.256051359147554e-07,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3007253408432007,
"step": 8420,
"valid_targets_mean": 5373.0,
"valid_targets_min": 338
},
{
"epoch": 6.426392067124333,
"grad_norm": 0.49903685482553933,
"learning_rate": 8.14823496619086e-07,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22903098165988922,
"step": 8425,
"valid_targets_mean": 3829.9,
"valid_targets_min": 1259
},
{
"epoch": 6.4302059496567505,
"grad_norm": 0.5012525211737092,
"learning_rate": 8.041112558883557e-07,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2882510721683502,
"step": 8430,
"valid_targets_mean": 4023.9,
"valid_targets_min": 1054
},
{
"epoch": 6.434019832189168,
"grad_norm": 0.5099919723651475,
"learning_rate": 7.934684524719683e-07,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2546488344669342,
"step": 8435,
"valid_targets_mean": 4289.2,
"valid_targets_min": 426
},
{
"epoch": 6.437833714721586,
"grad_norm": 0.4654407478835626,
"learning_rate": 7.828951248681505e-07,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24574923515319824,
"step": 8440,
"valid_targets_mean": 4327.0,
"valid_targets_min": 1432
},
{
"epoch": 6.441647597254004,
"grad_norm": 0.4612414886820737,
"learning_rate": 7.723913113238146e-07,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19901114702224731,
"step": 8445,
"valid_targets_mean": 3979.3,
"valid_targets_min": 1352
},
{
"epoch": 6.445461479786423,
"grad_norm": 0.5342280212284785,
"learning_rate": 7.619570498344209e-07,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2609269618988037,
"step": 8450,
"valid_targets_mean": 3531.6,
"valid_targets_min": 1374
},
{
"epoch": 6.449275362318841,
"grad_norm": 0.5046481339850619,
"learning_rate": 7.51592378143835e-07,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2273874282836914,
"step": 8455,
"valid_targets_mean": 4145.7,
"valid_targets_min": 894
},
{
"epoch": 6.453089244851259,
"grad_norm": 0.5046175752574743,
"learning_rate": 7.412973337441997e-07,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24711179733276367,
"step": 8460,
"valid_targets_mean": 3831.0,
"valid_targets_min": 970
},
{
"epoch": 6.4569031273836766,
"grad_norm": 0.5089035875525534,
"learning_rate": 7.310719538757927e-07,
"loss": 0.2479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24454724788665771,
"step": 8465,
"valid_targets_mean": 4124.6,
"valid_targets_min": 392
},
{
"epoch": 6.460717009916094,
"grad_norm": 0.46416602732457035,
"learning_rate": 7.209162755268928e-07,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25188159942626953,
"step": 8470,
"valid_targets_mean": 4515.6,
"valid_targets_min": 1454
},
{
"epoch": 6.464530892448512,
"grad_norm": 0.4499441231883731,
"learning_rate": 7.108303354336544e-07,
"loss": 0.2741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28176894783973694,
"step": 8475,
"valid_targets_mean": 5149.5,
"valid_targets_min": 1237
},
{
"epoch": 6.46834477498093,
"grad_norm": 0.8435636493276955,
"learning_rate": 7.008141700799531e-07,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30925872921943665,
"step": 8480,
"valid_targets_mean": 5316.2,
"valid_targets_min": 2132
},
{
"epoch": 6.472158657513349,
"grad_norm": 0.4849813862200653,
"learning_rate": 6.90867815697287e-07,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25278136134147644,
"step": 8485,
"valid_targets_mean": 4548.2,
"valid_targets_min": 1677
},
{
"epoch": 6.475972540045767,
"grad_norm": 0.46129805261149925,
"learning_rate": 6.809913082646113e-07,
"loss": 0.2631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25576576590538025,
"step": 8490,
"valid_targets_mean": 4950.3,
"valid_targets_min": 917
},
{
"epoch": 6.479786422578185,
"grad_norm": 0.626575600377628,
"learning_rate": 6.711846835082325e-07,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2927459180355072,
"step": 8495,
"valid_targets_mean": 4252.6,
"valid_targets_min": 1206
},
{
"epoch": 6.483600305110603,
"grad_norm": 0.5192502057353363,
"learning_rate": 6.614479769016657e-07,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.238042950630188,
"step": 8500,
"valid_targets_mean": 3840.0,
"valid_targets_min": 828
},
{
"epoch": 6.4874141876430205,
"grad_norm": 0.4570662293657686,
"learning_rate": 6.517812236655152e-07,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25383320450782776,
"step": 8505,
"valid_targets_mean": 4537.5,
"valid_targets_min": 1112
},
{
"epoch": 6.491228070175438,
"grad_norm": 0.5727447284814335,
"learning_rate": 6.421844587673365e-07,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26463204622268677,
"step": 8510,
"valid_targets_mean": 5026.8,
"valid_targets_min": 1170
},
{
"epoch": 6.495041952707856,
"grad_norm": 0.47162991186897507,
"learning_rate": 6.326577169215231e-07,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26361772418022156,
"step": 8515,
"valid_targets_mean": 5021.2,
"valid_targets_min": 952
},
{
"epoch": 6.498855835240275,
"grad_norm": 1.3899956907574107,
"learning_rate": 6.232010325891735e-07,
"loss": 0.3976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4216398000717163,
"step": 8520,
"valid_targets_mean": 790.2,
"valid_targets_min": 583
},
{
"epoch": 6.502669717772693,
"grad_norm": 0.4694331442372106,
"learning_rate": 6.1381443997796e-07,
"loss": 0.2616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26441314816474915,
"step": 8525,
"valid_targets_mean": 4803.4,
"valid_targets_min": 839
},
{
"epoch": 6.506483600305111,
"grad_norm": 0.5044007854322652,
"learning_rate": 6.044979730420198e-07,
"loss": 0.25,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21473665535449982,
"step": 8530,
"valid_targets_mean": 3430.1,
"valid_targets_min": 613
},
{
"epoch": 6.510297482837529,
"grad_norm": 0.5403224413072797,
"learning_rate": 5.952516654818197e-07,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2875039875507355,
"step": 8535,
"valid_targets_mean": 3952.5,
"valid_targets_min": 1128
},
{
"epoch": 6.5141113653699465,
"grad_norm": 0.43010869493650594,
"learning_rate": 5.86075550744043e-07,
"loss": 0.2446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2839283049106598,
"step": 8540,
"valid_targets_mean": 6165.4,
"valid_targets_min": 1886
},
{
"epoch": 6.517925247902364,
"grad_norm": 0.442055090560568,
"learning_rate": 5.769696620214582e-07,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.264087051153183,
"step": 8545,
"valid_targets_mean": 5245.8,
"valid_targets_min": 1233
},
{
"epoch": 6.521739130434782,
"grad_norm": 0.5380539845910357,
"learning_rate": 5.679340322528126e-07,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26377812027931213,
"step": 8550,
"valid_targets_mean": 4610.8,
"valid_targets_min": 1676
},
{
"epoch": 6.525553012967201,
"grad_norm": 0.4692104990180008,
"learning_rate": 5.589686941226991e-07,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25884586572647095,
"step": 8555,
"valid_targets_mean": 4473.1,
"valid_targets_min": 1297
},
{
"epoch": 6.529366895499619,
"grad_norm": 0.5133962979482154,
"learning_rate": 5.500736800614492e-07,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25123903155326843,
"step": 8560,
"valid_targets_mean": 4083.8,
"valid_targets_min": 1411
},
{
"epoch": 6.533180778032037,
"grad_norm": 0.6838627983702491,
"learning_rate": 5.412490222450095e-07,
"loss": 0.2606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2431752234697342,
"step": 8565,
"valid_targets_mean": 4096.5,
"valid_targets_min": 1368
},
{
"epoch": 6.536994660564455,
"grad_norm": 0.4805436149387146,
"learning_rate": 5.324947525948254e-07,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2567639648914337,
"step": 8570,
"valid_targets_mean": 4516.2,
"valid_targets_min": 1309
},
{
"epoch": 6.5408085430968725,
"grad_norm": 0.454962448002056,
"learning_rate": 5.238109027777283e-07,
"loss": 0.2638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2514365613460541,
"step": 8575,
"valid_targets_mean": 4904.3,
"valid_targets_min": 1127
},
{
"epoch": 6.54462242562929,
"grad_norm": 0.4793575688943854,
"learning_rate": 5.151975042058244e-07,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24711287021636963,
"step": 8580,
"valid_targets_mean": 4137.0,
"valid_targets_min": 806
},
{
"epoch": 6.548436308161708,
"grad_norm": 0.4801693917051084,
"learning_rate": 5.066545880363638e-07,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27172407507896423,
"step": 8585,
"valid_targets_mean": 4103.1,
"valid_targets_min": 818
},
{
"epoch": 6.552250190694126,
"grad_norm": 0.4288887079935217,
"learning_rate": 4.981821851716562e-07,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2810297906398773,
"step": 8590,
"valid_targets_mean": 5950.1,
"valid_targets_min": 1457
},
{
"epoch": 6.556064073226545,
"grad_norm": 0.447417911964289,
"learning_rate": 4.897803262589285e-07,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2641676962375641,
"step": 8595,
"valid_targets_mean": 4733.5,
"valid_targets_min": 1069
},
{
"epoch": 6.559877955758963,
"grad_norm": 0.5130635758947727,
"learning_rate": 4.814490416902451e-07,
"loss": 0.2646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28340986371040344,
"step": 8600,
"valid_targets_mean": 4399.0,
"valid_targets_min": 946
},
{
"epoch": 6.563691838291381,
"grad_norm": 0.48860800754653405,
"learning_rate": 4.731883616023658e-07,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23458512127399445,
"step": 8605,
"valid_targets_mean": 4400.2,
"valid_targets_min": 1848
},
{
"epoch": 6.567505720823799,
"grad_norm": 0.4486519842249868,
"learning_rate": 4.649983158766658e-07,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2617599070072174,
"step": 8610,
"valid_targets_mean": 5128.7,
"valid_targets_min": 1255
},
{
"epoch": 6.5713196033562165,
"grad_norm": 0.4613068465948873,
"learning_rate": 4.568789341390023e-07,
"loss": 0.2755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2712768614292145,
"step": 8615,
"valid_targets_mean": 5012.1,
"valid_targets_min": 613
},
{
"epoch": 6.575133485888634,
"grad_norm": 0.5413147396470408,
"learning_rate": 4.4883024575963055e-07,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25305524468421936,
"step": 8620,
"valid_targets_mean": 3542.5,
"valid_targets_min": 1116
},
{
"epoch": 6.578947368421053,
"grad_norm": 0.47959906526653856,
"learning_rate": 4.40852279853079e-07,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3105383813381195,
"step": 8625,
"valid_targets_mean": 4613.8,
"valid_targets_min": 1458
},
{
"epoch": 6.582761250953471,
"grad_norm": 0.5194487070204782,
"learning_rate": 4.3294506527805425e-07,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2872951626777649,
"step": 8630,
"valid_targets_mean": 4815.3,
"valid_targets_min": 496
},
{
"epoch": 6.586575133485889,
"grad_norm": 0.5190367669623117,
"learning_rate": 4.2510863063734087e-07,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22017668187618256,
"step": 8635,
"valid_targets_mean": 4139.2,
"valid_targets_min": 337
},
{
"epoch": 6.590389016018307,
"grad_norm": 0.4694041403487881,
"learning_rate": 4.173430042776749e-07,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22927264869213104,
"step": 8640,
"valid_targets_mean": 3980.7,
"valid_targets_min": 873
},
{
"epoch": 6.594202898550725,
"grad_norm": 0.5066127295615718,
"learning_rate": 4.0964821428967516e-07,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3201106786727905,
"step": 8645,
"valid_targets_mean": 4447.3,
"valid_targets_min": 959
},
{
"epoch": 6.5980167810831425,
"grad_norm": 0.4723010578935397,
"learning_rate": 4.020242885077097e-07,
"loss": 0.2481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2768709659576416,
"step": 8650,
"valid_targets_mean": 4583.0,
"valid_targets_min": 1399
},
{
"epoch": 6.60183066361556,
"grad_norm": 0.4707835769721507,
"learning_rate": 3.944712545098206e-07,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25435635447502136,
"step": 8655,
"valid_targets_mean": 4408.1,
"valid_targets_min": 737
},
{
"epoch": 6.605644546147978,
"grad_norm": 0.46052357212783235,
"learning_rate": 3.8698913961760396e-07,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2501215934753418,
"step": 8660,
"valid_targets_mean": 4504.2,
"valid_targets_min": 1246
},
{
"epoch": 6.609458428680397,
"grad_norm": 0.5958375550063665,
"learning_rate": 3.795779708961278e-07,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24585700035095215,
"step": 8665,
"valid_targets_mean": 3603.8,
"valid_targets_min": 983
},
{
"epoch": 6.613272311212815,
"grad_norm": 0.44664158445770247,
"learning_rate": 3.722377751538187e-07,
"loss": 0.2616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2540818154811859,
"step": 8670,
"valid_targets_mean": 5331.1,
"valid_targets_min": 1746
},
{
"epoch": 6.617086193745233,
"grad_norm": 0.4249148441892047,
"learning_rate": 3.6496857894237735e-07,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22584165632724762,
"step": 8675,
"valid_targets_mean": 4769.4,
"valid_targets_min": 468
},
{
"epoch": 6.620900076277651,
"grad_norm": 0.4972869734589808,
"learning_rate": 3.5777040855668356e-07,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2749437391757965,
"step": 8680,
"valid_targets_mean": 4438.9,
"valid_targets_min": 956
},
{
"epoch": 6.6247139588100685,
"grad_norm": 1.3596860424548278,
"learning_rate": 3.506432900346779e-07,
"loss": 0.3819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43016377091407776,
"step": 8685,
"valid_targets_mean": 843.3,
"valid_targets_min": 648
},
{
"epoch": 6.628527841342486,
"grad_norm": 0.4567195254428743,
"learning_rate": 3.4358724915730667e-07,
"loss": 0.3047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2491716593503952,
"step": 8690,
"valid_targets_mean": 4938.8,
"valid_targets_min": 541
},
{
"epoch": 6.632341723874904,
"grad_norm": 0.46756573873403356,
"learning_rate": 3.366023114483885e-07,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27434781193733215,
"step": 8695,
"valid_targets_mean": 4699.2,
"valid_targets_min": 1459
},
{
"epoch": 6.636155606407323,
"grad_norm": 0.48085087252841974,
"learning_rate": 3.2968850217455216e-07,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2507885694503784,
"step": 8700,
"valid_targets_mean": 4554.4,
"valid_targets_min": 1345
},
{
"epoch": 6.639969488939741,
"grad_norm": 0.4305286168328577,
"learning_rate": 3.228458463451256e-07,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27329325675964355,
"step": 8705,
"valid_targets_mean": 5775.1,
"valid_targets_min": 1627
},
{
"epoch": 6.643783371472159,
"grad_norm": 0.4335818665288777,
"learning_rate": 3.1607436871206043e-07,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23998205363750458,
"step": 8710,
"valid_targets_mean": 5298.2,
"valid_targets_min": 965
},
{
"epoch": 6.647597254004577,
"grad_norm": 0.5511616117071578,
"learning_rate": 3.0937409376982975e-07,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.279064804315567,
"step": 8715,
"valid_targets_mean": 4210.8,
"valid_targets_min": 1120
},
{
"epoch": 6.651411136536995,
"grad_norm": 0.49819383972885306,
"learning_rate": 3.0274504575534603e-07,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2777750790119171,
"step": 8720,
"valid_targets_mean": 4362.2,
"valid_targets_min": 526
},
{
"epoch": 6.655225019069412,
"grad_norm": 0.48970859152321294,
"learning_rate": 2.9618724864787896e-07,
"loss": 0.2701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29505303502082825,
"step": 8725,
"valid_targets_mean": 4475.5,
"valid_targets_min": 1178
},
{
"epoch": 6.65903890160183,
"grad_norm": 0.5365787991296255,
"learning_rate": 2.8970072616895326e-07,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23452679812908173,
"step": 8730,
"valid_targets_mean": 3625.1,
"valid_targets_min": 452
},
{
"epoch": 6.662852784134248,
"grad_norm": 0.4616599271545656,
"learning_rate": 2.8328550178227556e-07,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2593431770801544,
"step": 8735,
"valid_targets_mean": 4466.4,
"valid_targets_min": 1113
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.6455949927025287,
"learning_rate": 2.7694159869364525e-07,
"loss": 0.2628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2934395372867584,
"step": 8740,
"valid_targets_mean": 4677.8,
"valid_targets_min": 711
},
{
"epoch": 6.670480549199085,
"grad_norm": 0.45477101496916916,
"learning_rate": 2.706690398508727e-07,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2759816646575928,
"step": 8745,
"valid_targets_mean": 5200.2,
"valid_targets_min": 1401
},
{
"epoch": 6.674294431731503,
"grad_norm": 0.4579561242619741,
"learning_rate": 2.644678479436924e-07,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2668015956878662,
"step": 8750,
"valid_targets_mean": 4637.0,
"valid_targets_min": 1224
},
{
"epoch": 6.678108314263921,
"grad_norm": 0.5483706726448575,
"learning_rate": 2.5833804540368545e-07,
"loss": 0.2355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2324792742729187,
"step": 8755,
"valid_targets_mean": 4207.0,
"valid_targets_min": 709
},
{
"epoch": 6.6819221967963385,
"grad_norm": 0.4616777266359128,
"learning_rate": 2.522796544041928e-07,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2218731790781021,
"step": 8760,
"valid_targets_mean": 4335.9,
"valid_targets_min": 510
},
{
"epoch": 6.685736079328756,
"grad_norm": 0.5125443947686906,
"learning_rate": 2.4629269686024195e-07,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2388933151960373,
"step": 8765,
"valid_targets_mean": 3919.2,
"valid_targets_min": 1000
},
{
"epoch": 6.689549961861175,
"grad_norm": 0.5000080999041109,
"learning_rate": 2.4037719442846497e-07,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2521762251853943,
"step": 8770,
"valid_targets_mean": 4245.3,
"valid_targets_min": 1029
},
{
"epoch": 6.693363844393593,
"grad_norm": 0.4614214393159042,
"learning_rate": 2.345331685070118e-07,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2523350417613983,
"step": 8775,
"valid_targets_mean": 5094.4,
"valid_targets_min": 1841
},
{
"epoch": 6.697177726926011,
"grad_norm": 0.49785359302904225,
"learning_rate": 2.2876064023549028e-07,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25749513506889343,
"step": 8780,
"valid_targets_mean": 3709.2,
"valid_targets_min": 423
},
{
"epoch": 6.700991609458429,
"grad_norm": 0.5382263987761529,
"learning_rate": 2.2305963049487068e-07,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28535568714141846,
"step": 8785,
"valid_targets_mean": 4224.0,
"valid_targets_min": 1141
},
{
"epoch": 6.704805491990847,
"grad_norm": 0.515491071106708,
"learning_rate": 2.1743015990742576e-07,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2274818867444992,
"step": 8790,
"valid_targets_mean": 3546.7,
"valid_targets_min": 892
},
{
"epoch": 6.7086193745232645,
"grad_norm": 0.4904593792098621,
"learning_rate": 2.1187224883664425e-07,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23734210431575775,
"step": 8795,
"valid_targets_mean": 4233.8,
"valid_targets_min": 291
},
{
"epoch": 6.712433257055682,
"grad_norm": 0.4764836214210563,
"learning_rate": 2.063859173871685e-07,
"loss": 0.2516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25665369629859924,
"step": 8800,
"valid_targets_mean": 4348.4,
"valid_targets_min": 1155
},
{
"epoch": 6.7162471395881,
"grad_norm": 0.5364539012840841,
"learning_rate": 2.009711854047125e-07,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26761090755462646,
"step": 8805,
"valid_targets_mean": 3480.5,
"valid_targets_min": 454
},
{
"epoch": 6.720061022120519,
"grad_norm": 0.43633373903725753,
"learning_rate": 1.956280724759907e-07,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2615395486354828,
"step": 8810,
"valid_targets_mean": 5068.1,
"valid_targets_min": 1043
},
{
"epoch": 6.723874904652937,
"grad_norm": 0.5009990477100269,
"learning_rate": 1.903565979286559e-07,
"loss": 0.2437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2951163947582245,
"step": 8815,
"valid_targets_mean": 4381.7,
"valid_targets_min": 984
},
{
"epoch": 6.727688787185355,
"grad_norm": 0.4884652809586842,
"learning_rate": 1.8515678083121936e-07,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24884463846683502,
"step": 8820,
"valid_targets_mean": 4959.0,
"valid_targets_min": 688
},
{
"epoch": 6.731502669717773,
"grad_norm": 0.5180850457811853,
"learning_rate": 1.8002863999298624e-07,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2687952220439911,
"step": 8825,
"valid_targets_mean": 4047.2,
"valid_targets_min": 924
},
{
"epoch": 6.7353165522501905,
"grad_norm": 0.4893545194267149,
"learning_rate": 1.749721939639848e-07,
"loss": 0.2642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23527388274669647,
"step": 8830,
"valid_targets_mean": 4457.8,
"valid_targets_min": 1307
},
{
"epoch": 6.739130434782608,
"grad_norm": 0.5488105797549294,
"learning_rate": 1.6998746103490838e-07,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29204466938972473,
"step": 8835,
"valid_targets_mean": 4550.1,
"valid_targets_min": 1258
},
{
"epoch": 6.742944317315027,
"grad_norm": 0.47929795689362814,
"learning_rate": 1.650744592370357e-07,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23622556030750275,
"step": 8840,
"valid_targets_mean": 4238.9,
"valid_targets_min": 1358
},
{
"epoch": 6.746758199847445,
"grad_norm": 0.48193540879637353,
"learning_rate": 1.602332063421752e-07,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542840540409088,
"step": 8845,
"valid_targets_mean": 4354.8,
"valid_targets_min": 1124
},
{
"epoch": 6.750572082379863,
"grad_norm": 1.6083685967329227,
"learning_rate": 1.5546371986259856e-07,
"loss": 0.3409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4540012776851654,
"step": 8850,
"valid_targets_mean": 798.7,
"valid_targets_min": 662
},
{
"epoch": 6.754385964912281,
"grad_norm": 0.4479560061910448,
"learning_rate": 1.5076601705097171e-07,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26199549436569214,
"step": 8855,
"valid_targets_mean": 4903.4,
"valid_targets_min": 1525
},
{
"epoch": 6.758199847444699,
"grad_norm": 0.5167509652707176,
"learning_rate": 1.4614011490030833e-07,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21811072528362274,
"step": 8860,
"valid_targets_mean": 3528.3,
"valid_targets_min": 1120
},
{
"epoch": 6.762013729977117,
"grad_norm": 0.5466567892986032,
"learning_rate": 1.4158603014388317e-07,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22469651699066162,
"step": 8865,
"valid_targets_mean": 3092.0,
"valid_targets_min": 1160
},
{
"epoch": 6.7658276125095345,
"grad_norm": 0.5078871078005721,
"learning_rate": 1.3710377925520102e-07,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2852909564971924,
"step": 8870,
"valid_targets_mean": 4437.4,
"valid_targets_min": 1185
},
{
"epoch": 6.769641495041952,
"grad_norm": 0.4667897106491802,
"learning_rate": 1.3269337844790565e-07,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30474594235420227,
"step": 8875,
"valid_targets_mean": 5781.1,
"valid_targets_min": 1382
},
{
"epoch": 6.77345537757437,
"grad_norm": 0.45330866220580385,
"learning_rate": 1.283548436757509e-07,
"loss": 0.2428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2104359120130539,
"step": 8880,
"valid_targets_mean": 5018.0,
"valid_targets_min": 1360
},
{
"epoch": 6.777269260106789,
"grad_norm": 0.47262441892560764,
"learning_rate": 1.2408819063252531e-07,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2537544071674347,
"step": 8885,
"valid_targets_mean": 4318.1,
"valid_targets_min": 1018
},
{
"epoch": 6.781083142639207,
"grad_norm": 0.4688379872758674,
"learning_rate": 1.1989343475199422e-07,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2471754550933838,
"step": 8890,
"valid_targets_mean": 4464.4,
"valid_targets_min": 671
},
{
"epoch": 6.784897025171625,
"grad_norm": 0.46613067717925505,
"learning_rate": 1.1577059120785994e-07,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24822942912578583,
"step": 8895,
"valid_targets_mean": 4436.9,
"valid_targets_min": 1155
},
{
"epoch": 6.788710907704043,
"grad_norm": 0.4246933283721545,
"learning_rate": 1.1171967491368396e-07,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2612958252429962,
"step": 8900,
"valid_targets_mean": 5156.3,
"valid_targets_min": 1447
},
{
"epoch": 6.7925247902364605,
"grad_norm": 0.488048889984009,
"learning_rate": 1.0774070052285367e-07,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2610219419002533,
"step": 8905,
"valid_targets_mean": 4220.4,
"valid_targets_min": 834
},
{
"epoch": 6.796338672768878,
"grad_norm": 0.45744606793079273,
"learning_rate": 1.0383368242852021e-07,
"loss": 0.2592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2370743304491043,
"step": 8910,
"valid_targets_mean": 4227.2,
"valid_targets_min": 867
},
{
"epoch": 6.800152555301297,
"grad_norm": 0.44106979768649596,
"learning_rate": 9.999863476354289e-08,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2570864260196686,
"step": 8915,
"valid_targets_mean": 4943.4,
"valid_targets_min": 871
},
{
"epoch": 6.803966437833715,
"grad_norm": 0.4655514026103222,
"learning_rate": 9.623557140044481e-08,
"loss": 0.2281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2311626523733139,
"step": 8920,
"valid_targets_mean": 4024.0,
"valid_targets_min": 1455
},
{
"epoch": 6.807780320366133,
"grad_norm": 0.4400894039415246,
"learning_rate": 9.254450595136188e-08,
"loss": 0.2736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2622435986995697,
"step": 8925,
"valid_targets_mean": 5075.9,
"valid_targets_min": 1286
},
{
"epoch": 6.811594202898551,
"grad_norm": 0.4603549740303837,
"learning_rate": 8.892545176799161e-08,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24099206924438477,
"step": 8930,
"valid_targets_mean": 4275.4,
"valid_targets_min": 1051
},
{
"epoch": 6.815408085430969,
"grad_norm": 0.45744142908056945,
"learning_rate": 8.537842194153767e-08,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27880170941352844,
"step": 8935,
"valid_targets_mean": 4513.8,
"valid_targets_min": 1277
},
{
"epoch": 6.8192219679633865,
"grad_norm": 0.4933018643513688,
"learning_rate": 8.190342930268325e-08,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20053613185882568,
"step": 8940,
"valid_targets_mean": 3789.4,
"valid_targets_min": 1465
},
{
"epoch": 6.823035850495804,
"grad_norm": 0.4545423866647215,
"learning_rate": 7.850048642151775e-08,
"loss": 0.2471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23181915283203125,
"step": 8945,
"valid_targets_mean": 4632.9,
"valid_targets_min": 1292
},
{
"epoch": 6.826849733028222,
"grad_norm": 0.4902945311689018,
"learning_rate": 7.516960560751462e-08,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2742360532283783,
"step": 8950,
"valid_targets_mean": 3948.9,
"valid_targets_min": 993
},
{
"epoch": 6.830663615560641,
"grad_norm": 0.4498076800376056,
"learning_rate": 7.19107989094736e-08,
"loss": 0.269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26429128646850586,
"step": 8955,
"valid_targets_mean": 4785.0,
"valid_targets_min": 986
},
{
"epoch": 6.834477498093059,
"grad_norm": 0.4649434981304079,
"learning_rate": 6.872407811547855e-08,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24602733552455902,
"step": 8960,
"valid_targets_mean": 4312.8,
"valid_targets_min": 1685
},
{
"epoch": 6.838291380625477,
"grad_norm": 0.4584733518995103,
"learning_rate": 6.560945475285741e-08,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2534709572792053,
"step": 8965,
"valid_targets_mean": 4685.2,
"valid_targets_min": 1185
},
{
"epoch": 6.842105263157895,
"grad_norm": 0.5254599972627705,
"learning_rate": 6.256694008814679e-08,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3134000301361084,
"step": 8970,
"valid_targets_mean": 4030.5,
"valid_targets_min": 1191
},
{
"epoch": 6.845919145690313,
"grad_norm": 0.4796585637484957,
"learning_rate": 5.9596545127036385e-08,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22937195003032684,
"step": 8975,
"valid_targets_mean": 4679.3,
"valid_targets_min": 1334
},
{
"epoch": 6.8497330282227304,
"grad_norm": 0.5194624420495947,
"learning_rate": 5.669828061433791e-08,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2806025445461273,
"step": 8980,
"valid_targets_mean": 4014.6,
"valid_targets_min": 991
},
{
"epoch": 6.853546910755149,
"grad_norm": 0.4705120799985797,
"learning_rate": 5.387215703395177e-08,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28963637351989746,
"step": 8985,
"valid_targets_mean": 5085.6,
"valid_targets_min": 1168
},
{
"epoch": 6.857360793287567,
"grad_norm": 0.5819980638824224,
"learning_rate": 5.111818460881379e-08,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26628777384757996,
"step": 8990,
"valid_targets_mean": 4100.6,
"valid_targets_min": 927
},
{
"epoch": 6.861174675819985,
"grad_norm": 0.4388922287444261,
"learning_rate": 4.843637330087525e-08,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28951165080070496,
"step": 8995,
"valid_targets_mean": 5574.4,
"valid_targets_min": 713
},
{
"epoch": 6.864988558352403,
"grad_norm": 0.5130442634203314,
"learning_rate": 4.582673281105621e-08,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22083990275859833,
"step": 9000,
"valid_targets_mean": 3968.1,
"valid_targets_min": 523
},
{
"epoch": 6.868802440884821,
"grad_norm": 0.519678895479751,
"learning_rate": 4.3289272579212226e-08,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2769645154476166,
"step": 9005,
"valid_targets_mean": 3708.4,
"valid_targets_min": 704
},
{
"epoch": 6.872616323417239,
"grad_norm": 0.48803210237269884,
"learning_rate": 4.082400178409884e-08,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24909156560897827,
"step": 9010,
"valid_targets_mean": 4402.6,
"valid_targets_min": 1164
},
{
"epoch": 6.8764302059496565,
"grad_norm": 1.310490122044137,
"learning_rate": 3.843092934334714e-08,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42711055278778076,
"step": 9015,
"valid_targets_mean": 874.1,
"valid_targets_min": 602
},
{
"epoch": 6.880244088482074,
"grad_norm": 0.5194420306200203,
"learning_rate": 3.6110063913419314e-08,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.270808607339859,
"step": 9020,
"valid_targets_mean": 3739.3,
"valid_targets_min": 886
},
{
"epoch": 6.884057971014493,
"grad_norm": 0.4523455589120904,
"learning_rate": 3.386141388958652e-08,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24892598390579224,
"step": 9025,
"valid_targets_mean": 4797.2,
"valid_targets_min": 858
},
{
"epoch": 6.887871853546911,
"grad_norm": 0.48287864804733494,
"learning_rate": 3.1684987405891096e-08,
"loss": 0.2617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28461983799934387,
"step": 9030,
"valid_targets_mean": 4661.2,
"valid_targets_min": 844
},
{
"epoch": 6.891685736079329,
"grad_norm": 0.4721016692882381,
"learning_rate": 2.9580792335126562e-08,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28126761317253113,
"step": 9035,
"valid_targets_mean": 5096.3,
"valid_targets_min": 1602
},
{
"epoch": 6.895499618611747,
"grad_norm": 0.4841861982217126,
"learning_rate": 2.7548836288797675e-08,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28836727142333984,
"step": 9040,
"valid_targets_mean": 4471.4,
"valid_targets_min": 473
},
{
"epoch": 6.899313501144165,
"grad_norm": 0.682082195562495,
"learning_rate": 2.5589126617102666e-08,
"loss": 0.2515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2549896538257599,
"step": 9045,
"valid_targets_mean": 3695.0,
"valid_targets_min": 1341
},
{
"epoch": 6.9031273836765825,
"grad_norm": 0.4430357315125749,
"learning_rate": 2.3701670408904365e-08,
"loss": 0.262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2781337797641754,
"step": 9050,
"valid_targets_mean": 5056.7,
"valid_targets_min": 1742
},
{
"epoch": 6.906941266209,
"grad_norm": 0.4961634791637363,
"learning_rate": 2.1886474491699116e-08,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2650142014026642,
"step": 9055,
"valid_targets_mean": 4381.1,
"valid_targets_min": 1526
},
{
"epoch": 6.910755148741419,
"grad_norm": 0.4766223024157269,
"learning_rate": 2.014354543159458e-08,
"loss": 0.2597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24406524002552032,
"step": 9060,
"valid_targets_mean": 4142.5,
"valid_targets_min": 380
},
{
"epoch": 6.914569031273837,
"grad_norm": 0.5041571799311416,
"learning_rate": 1.847288953329418e-08,
"loss": 0.2621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2359909564256668,
"step": 9065,
"valid_targets_mean": 4001.7,
"valid_targets_min": 1419
},
{
"epoch": 6.918382913806255,
"grad_norm": 0.4689832398936382,
"learning_rate": 1.6874512840063806e-08,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23846976459026337,
"step": 9070,
"valid_targets_mean": 4615.5,
"valid_targets_min": 1134
},
{
"epoch": 6.922196796338673,
"grad_norm": 0.4215746760654066,
"learning_rate": 1.5348421133711822e-08,
"loss": 0.2671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2647766172885895,
"step": 9075,
"valid_targets_mean": 5416.6,
"valid_targets_min": 1373
},
{
"epoch": 6.926010678871091,
"grad_norm": 0.47434945452469185,
"learning_rate": 1.3894619934571307e-08,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2696935534477234,
"step": 9080,
"valid_targets_mean": 4957.5,
"valid_targets_min": 1516
},
{
"epoch": 6.9298245614035086,
"grad_norm": 0.5140704574961166,
"learning_rate": 1.2513114501482294e-08,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29723748564720154,
"step": 9085,
"valid_targets_mean": 4311.6,
"valid_targets_min": 1513
},
{
"epoch": 6.933638443935926,
"grad_norm": 0.44704021411153305,
"learning_rate": 1.1203909831762893e-08,
"loss": 0.2594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2530190050601959,
"step": 9090,
"valid_targets_mean": 4857.2,
"valid_targets_min": 447
},
{
"epoch": 6.937452326468344,
"grad_norm": 0.4606405386761923,
"learning_rate": 9.967010661204868e-09,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2141771763563156,
"step": 9095,
"valid_targets_mean": 4249.3,
"valid_targets_min": 1203
},
{
"epoch": 6.941266209000763,
"grad_norm": 0.4346601417829936,
"learning_rate": 8.802421464040312e-09,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2532062828540802,
"step": 9100,
"valid_targets_mean": 5482.1,
"valid_targets_min": 1125
},
{
"epoch": 6.945080091533181,
"grad_norm": 0.5138564719167915,
"learning_rate": 7.710146452941658e-09,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25881847739219666,
"step": 9105,
"valid_targets_mean": 4072.5,
"valid_targets_min": 1354
},
{
"epoch": 6.948893974065599,
"grad_norm": 0.5443768694531692,
"learning_rate": 6.690189578999473e-09,
"loss": 0.2496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22537367045879364,
"step": 9110,
"valid_targets_mean": 3369.6,
"valid_targets_min": 827
},
{
"epoch": 6.952707856598017,
"grad_norm": 0.5109364822190952,
"learning_rate": 5.742554531700251e-09,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23135484755039215,
"step": 9115,
"valid_targets_mean": 3833.6,
"valid_targets_min": 883
},
{
"epoch": 6.956521739130435,
"grad_norm": 0.46466195137513505,
"learning_rate": 4.8672447389286335e-09,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24387897551059723,
"step": 9120,
"valid_targets_mean": 4876.5,
"valid_targets_min": 1284
},
{
"epoch": 6.9603356216628525,
"grad_norm": 0.5300251711812586,
"learning_rate": 4.064263366942989e-09,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2824271023273468,
"step": 9125,
"valid_targets_mean": 4544.0,
"valid_targets_min": 1082
},
{
"epoch": 6.964149504195271,
"grad_norm": 0.4806841321702372,
"learning_rate": 3.333613320368745e-09,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22269928455352783,
"step": 9130,
"valid_targets_mean": 4612.7,
"valid_targets_min": 1333
},
{
"epoch": 6.967963386727689,
"grad_norm": 0.5416974736321651,
"learning_rate": 2.6752972421895117e-09,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2618859112262726,
"step": 9135,
"valid_targets_mean": 3495.5,
"valid_targets_min": 620
},
{
"epoch": 6.971777269260107,
"grad_norm": 0.459511556904324,
"learning_rate": 2.0893175137293163e-09,
"loss": 0.2672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535509169101715,
"step": 9140,
"valid_targets_mean": 4382.7,
"valid_targets_min": 505
},
{
"epoch": 6.975591151792525,
"grad_norm": 0.48437983570830595,
"learning_rate": 1.5756762546570437e-09,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2759089469909668,
"step": 9145,
"valid_targets_mean": 3919.9,
"valid_targets_min": 1075
},
{
"epoch": 6.979405034324943,
"grad_norm": 0.49415357039663277,
"learning_rate": 1.1343753229642317e-09,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23885183036327362,
"step": 9150,
"valid_targets_mean": 3753.2,
"valid_targets_min": 753
},
{
"epoch": 6.983218916857361,
"grad_norm": 0.5461652605442551,
"learning_rate": 7.654163149717342e-10,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2608436048030853,
"step": 9155,
"valid_targets_mean": 3563.1,
"valid_targets_min": 521
},
{
"epoch": 6.9870327993897785,
"grad_norm": 0.545724031102777,
"learning_rate": 4.688005653163963e-10,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27841898798942566,
"step": 9160,
"valid_targets_mean": 4363.7,
"valid_targets_min": 447
},
{
"epoch": 6.990846681922196,
"grad_norm": 0.4705636484040312,
"learning_rate": 2.44529146942174e-10,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2812120020389557,
"step": 9165,
"valid_targets_mean": 4790.8,
"valid_targets_min": 915
},
{
"epoch": 6.994660564454615,
"grad_norm": 0.5291991743545336,
"learning_rate": 9.260287111123589e-11,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2218012809753418,
"step": 9170,
"valid_targets_mean": 3817.0,
"valid_targets_min": 1202
},
{
"epoch": 6.998474446987033,
"grad_norm": 1.5469628469507675,
"learning_rate": 1.3022287386199594e-11,
"loss": 0.372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4602835476398468,
"step": 9175,
"valid_targets_mean": 780.0,
"valid_targets_min": 493
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4288143217563629,
"step": 9177,
"total_flos": 4631781651513344.0,
"train_loss": 0.31498055520031176,
"train_runtime": 65837.0719,
"train_samples_per_second": 3.345,
"train_steps_per_second": 0.139,
"valid_targets_mean": 858.8,
"valid_targets_min": 497
}
],
"logging_steps": 5,
"max_steps": 9177,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 4631781651513344.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}