Files
exp_tas_optimal_combined_tr…/trainer_state.json
ModelHub XC e4c310e9e0 初始化项目,由ModelHub XC社区提供模型
Model: laion/exp_tas_optimal_combined_traces
Source: Original Platform
2026-06-01 00:43:12 +08:00

8760 lines
243 KiB
JSON

{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 3962,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008841732979664015,
"grad_norm": 16.43759145601646,
"learning_rate": 4.030226700251889e-07,
"loss": 0.9913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4914407730102539,
"step": 5,
"valid_targets_mean": 3975.9,
"valid_targets_min": 247
},
{
"epoch": 0.01768346595932803,
"grad_norm": 17.984303937601393,
"learning_rate": 9.068010075566751e-07,
"loss": 1.09,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5117278099060059,
"step": 10,
"valid_targets_mean": 2293.8,
"valid_targets_min": 269
},
{
"epoch": 0.026525198938992044,
"grad_norm": 17.430054844624365,
"learning_rate": 1.4105793450881613e-06,
"loss": 1.0664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48715919256210327,
"step": 15,
"valid_targets_mean": 3742.1,
"valid_targets_min": 610
},
{
"epoch": 0.03536693191865606,
"grad_norm": 13.157985816910156,
"learning_rate": 1.9143576826196476e-06,
"loss": 1.0244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48635387420654297,
"step": 20,
"valid_targets_mean": 3909.9,
"valid_targets_min": 431
},
{
"epoch": 0.04420866489832007,
"grad_norm": 7.039459793103061,
"learning_rate": 2.4181360201511335e-06,
"loss": 0.9523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5950973629951477,
"step": 25,
"valid_targets_mean": 4854.0,
"valid_targets_min": 1882
},
{
"epoch": 0.05305039787798409,
"grad_norm": 4.37502689672069,
"learning_rate": 2.92191435768262e-06,
"loss": 0.8882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4377889037132263,
"step": 30,
"valid_targets_mean": 3904.2,
"valid_targets_min": 558
},
{
"epoch": 0.0618921308576481,
"grad_norm": 2.2984916066569143,
"learning_rate": 3.425692695214106e-06,
"loss": 0.8596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3730544149875641,
"step": 35,
"valid_targets_mean": 4253.4,
"valid_targets_min": 403
},
{
"epoch": 0.07073386383731212,
"grad_norm": 1.749502864868188,
"learning_rate": 3.9294710327455925e-06,
"loss": 0.8071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37501755356788635,
"step": 40,
"valid_targets_mean": 3304.0,
"valid_targets_min": 463
},
{
"epoch": 0.07957559681697612,
"grad_norm": 1.4297619383408833,
"learning_rate": 4.433249370277078e-06,
"loss": 0.7654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2531526982784271,
"step": 45,
"valid_targets_mean": 2443.0,
"valid_targets_min": 536
},
{
"epoch": 0.08841732979664015,
"grad_norm": 1.2107916623135075,
"learning_rate": 4.937027707808565e-06,
"loss": 0.7661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26174238324165344,
"step": 50,
"valid_targets_mean": 1962.4,
"valid_targets_min": 419
},
{
"epoch": 0.09725906277630415,
"grad_norm": 1.1177863382586022,
"learning_rate": 5.440806045340051e-06,
"loss": 0.7088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2441769391298294,
"step": 55,
"valid_targets_mean": 1324.0,
"valid_targets_min": 387
},
{
"epoch": 0.10610079575596817,
"grad_norm": 1.3240485836200855,
"learning_rate": 5.944584382871537e-06,
"loss": 0.7418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45804762840270996,
"step": 60,
"valid_targets_mean": 2281.6,
"valid_targets_min": 299
},
{
"epoch": 0.11494252873563218,
"grad_norm": 0.9887476322800939,
"learning_rate": 6.448362720403023e-06,
"loss": 0.7786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3559702932834625,
"step": 65,
"valid_targets_mean": 2576.8,
"valid_targets_min": 979
},
{
"epoch": 0.1237842617152962,
"grad_norm": 0.8313614619463878,
"learning_rate": 6.9521410579345095e-06,
"loss": 0.7667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32869428396224976,
"step": 70,
"valid_targets_mean": 2681.1,
"valid_targets_min": 559
},
{
"epoch": 0.13262599469496023,
"grad_norm": 1.2928448614693209,
"learning_rate": 7.455919395465996e-06,
"loss": 0.7316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4524758458137512,
"step": 75,
"valid_targets_mean": 2086.6,
"valid_targets_min": 305
},
{
"epoch": 0.14146772767462423,
"grad_norm": 0.9039110142607959,
"learning_rate": 7.959697732997482e-06,
"loss": 0.7216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41223078966140747,
"step": 80,
"valid_targets_mean": 2522.0,
"valid_targets_min": 418
},
{
"epoch": 0.15030946065428824,
"grad_norm": 1.1531713116573887,
"learning_rate": 8.463476070528968e-06,
"loss": 0.6962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31595444679260254,
"step": 85,
"valid_targets_mean": 2714.1,
"valid_targets_min": 435
},
{
"epoch": 0.15915119363395225,
"grad_norm": 0.7279561415401078,
"learning_rate": 8.967254408060454e-06,
"loss": 0.7161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45249640941619873,
"step": 90,
"valid_targets_mean": 4901.6,
"valid_targets_min": 628
},
{
"epoch": 0.16799292661361626,
"grad_norm": 0.7881029215112537,
"learning_rate": 9.47103274559194e-06,
"loss": 0.706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31990885734558105,
"step": 95,
"valid_targets_mean": 2807.6,
"valid_targets_min": 268
},
{
"epoch": 0.1768346595932803,
"grad_norm": 0.7086656082236659,
"learning_rate": 9.974811083123427e-06,
"loss": 0.6583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.270596981048584,
"step": 100,
"valid_targets_mean": 2979.0,
"valid_targets_min": 722
},
{
"epoch": 0.1856763925729443,
"grad_norm": 0.8874052957709296,
"learning_rate": 1.0478589420654912e-05,
"loss": 0.6697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24225851893424988,
"step": 105,
"valid_targets_mean": 1624.0,
"valid_targets_min": 356
},
{
"epoch": 0.1945181255526083,
"grad_norm": 0.8682741626307907,
"learning_rate": 1.0982367758186399e-05,
"loss": 0.6139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38384777307510376,
"step": 110,
"valid_targets_mean": 2603.8,
"valid_targets_min": 504
},
{
"epoch": 0.20335985853227231,
"grad_norm": 0.7893830841438993,
"learning_rate": 1.1486146095717885e-05,
"loss": 0.6651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3616026043891907,
"step": 115,
"valid_targets_mean": 5229.1,
"valid_targets_min": 648
},
{
"epoch": 0.21220159151193635,
"grad_norm": 0.8435136463460109,
"learning_rate": 1.1989924433249371e-05,
"loss": 0.7056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35327407717704773,
"step": 120,
"valid_targets_mean": 3276.9,
"valid_targets_min": 557
},
{
"epoch": 0.22104332449160036,
"grad_norm": 0.8326030890475514,
"learning_rate": 1.2493702770780859e-05,
"loss": 0.6327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29393622279167175,
"step": 125,
"valid_targets_mean": 3015.4,
"valid_targets_min": 1786
},
{
"epoch": 0.22988505747126436,
"grad_norm": 0.5791447791458552,
"learning_rate": 1.2997481108312344e-05,
"loss": 0.6477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31838011741638184,
"step": 130,
"valid_targets_mean": 4220.1,
"valid_targets_min": 704
},
{
"epoch": 0.23872679045092837,
"grad_norm": 0.7833412749104234,
"learning_rate": 1.350125944584383e-05,
"loss": 0.6188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3599586486816406,
"step": 135,
"valid_targets_mean": 3493.0,
"valid_targets_min": 562
},
{
"epoch": 0.2475685234305924,
"grad_norm": 0.6930132817315054,
"learning_rate": 1.4005037783375318e-05,
"loss": 0.6729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3735961318016052,
"step": 140,
"valid_targets_mean": 3788.9,
"valid_targets_min": 1905
},
{
"epoch": 0.2564102564102564,
"grad_norm": 0.6900812305728492,
"learning_rate": 1.4508816120906802e-05,
"loss": 0.5868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2900860905647278,
"step": 145,
"valid_targets_mean": 3795.8,
"valid_targets_min": 881
},
{
"epoch": 0.26525198938992045,
"grad_norm": 0.668587653722343,
"learning_rate": 1.5012594458438288e-05,
"loss": 0.6371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23740538954734802,
"step": 150,
"valid_targets_mean": 3166.9,
"valid_targets_min": 1434
},
{
"epoch": 0.27409372236958446,
"grad_norm": 0.6857654288467885,
"learning_rate": 1.5516372795969776e-05,
"loss": 0.6119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.49299874901771545,
"step": 155,
"valid_targets_mean": 5421.9,
"valid_targets_min": 2002
},
{
"epoch": 0.28293545534924847,
"grad_norm": 0.7011124721817551,
"learning_rate": 1.602015113350126e-05,
"loss": 0.6135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2792966365814209,
"step": 160,
"valid_targets_mean": 3557.1,
"valid_targets_min": 307
},
{
"epoch": 0.2917771883289125,
"grad_norm": 0.7181568311757064,
"learning_rate": 1.6523929471032747e-05,
"loss": 0.6163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3261794447898865,
"step": 165,
"valid_targets_mean": 3577.6,
"valid_targets_min": 1825
},
{
"epoch": 0.3006189213085765,
"grad_norm": 0.6383260621735827,
"learning_rate": 1.7027707808564233e-05,
"loss": 0.6208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2658522427082062,
"step": 170,
"valid_targets_mean": 4118.4,
"valid_targets_min": 554
},
{
"epoch": 0.3094606542882405,
"grad_norm": 0.873748558543848,
"learning_rate": 1.753148614609572e-05,
"loss": 0.6582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27786922454833984,
"step": 175,
"valid_targets_mean": 2538.9,
"valid_targets_min": 411
},
{
"epoch": 0.3183023872679045,
"grad_norm": 0.7741218070486372,
"learning_rate": 1.8035264483627205e-05,
"loss": 0.661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3300468325614929,
"step": 180,
"valid_targets_mean": 3783.0,
"valid_targets_min": 716
},
{
"epoch": 0.3271441202475685,
"grad_norm": 0.7153501560841902,
"learning_rate": 1.8539042821158694e-05,
"loss": 0.613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30669140815734863,
"step": 185,
"valid_targets_mean": 2831.9,
"valid_targets_min": 663
},
{
"epoch": 0.3359858532272325,
"grad_norm": 0.8733028655615769,
"learning_rate": 1.9042821158690177e-05,
"loss": 0.6091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4316086769104004,
"step": 190,
"valid_targets_mean": 3605.1,
"valid_targets_min": 411
},
{
"epoch": 0.3448275862068966,
"grad_norm": 0.8909617924940159,
"learning_rate": 1.9546599496221663e-05,
"loss": 0.7227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29832324385643005,
"step": 195,
"valid_targets_mean": 2360.1,
"valid_targets_min": 1393
},
{
"epoch": 0.3536693191865606,
"grad_norm": 0.7676692325940812,
"learning_rate": 2.0050377833753152e-05,
"loss": 0.6012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.349293053150177,
"step": 200,
"valid_targets_mean": 3419.4,
"valid_targets_min": 532
},
{
"epoch": 0.3625110521662246,
"grad_norm": 0.6966533272502462,
"learning_rate": 2.0554156171284634e-05,
"loss": 0.597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34834665060043335,
"step": 205,
"valid_targets_mean": 4089.6,
"valid_targets_min": 2040
},
{
"epoch": 0.3713527851458886,
"grad_norm": 0.9033467905392003,
"learning_rate": 2.1057934508816124e-05,
"loss": 0.6181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3413087725639343,
"step": 210,
"valid_targets_mean": 2691.6,
"valid_targets_min": 1037
},
{
"epoch": 0.3801945181255526,
"grad_norm": 1.709473285401154,
"learning_rate": 2.156171284634761e-05,
"loss": 0.6068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2899201512336731,
"step": 215,
"valid_targets_mean": 3180.1,
"valid_targets_min": 317
},
{
"epoch": 0.3890362511052166,
"grad_norm": 0.7521210734695193,
"learning_rate": 2.2065491183879092e-05,
"loss": 0.5964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3372876048088074,
"step": 220,
"valid_targets_mean": 3230.0,
"valid_targets_min": 383
},
{
"epoch": 0.3978779840848806,
"grad_norm": 0.8333691908125227,
"learning_rate": 2.256926952141058e-05,
"loss": 0.6837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3745100498199463,
"step": 225,
"valid_targets_mean": 2964.1,
"valid_targets_min": 761
},
{
"epoch": 0.40671971706454463,
"grad_norm": 0.6656840184265772,
"learning_rate": 2.3073047858942067e-05,
"loss": 0.603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19232776761054993,
"step": 230,
"valid_targets_mean": 2728.2,
"valid_targets_min": 321
},
{
"epoch": 0.4155614500442087,
"grad_norm": 0.7255450538392068,
"learning_rate": 2.3576826196473553e-05,
"loss": 0.597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33167585730552673,
"step": 235,
"valid_targets_mean": 3975.6,
"valid_targets_min": 1787
},
{
"epoch": 0.4244031830238727,
"grad_norm": 0.7811965432597004,
"learning_rate": 2.408060453400504e-05,
"loss": 0.6116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3258014917373657,
"step": 240,
"valid_targets_mean": 4064.9,
"valid_targets_min": 1431
},
{
"epoch": 0.4332449160035367,
"grad_norm": 0.7283721698739326,
"learning_rate": 2.4584382871536528e-05,
"loss": 0.6241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2866038680076599,
"step": 245,
"valid_targets_mean": 2983.4,
"valid_targets_min": 1332
},
{
"epoch": 0.4420866489832007,
"grad_norm": 0.8218129094311453,
"learning_rate": 2.508816120906801e-05,
"loss": 0.6053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33566445112228394,
"step": 250,
"valid_targets_mean": 3558.0,
"valid_targets_min": 493
},
{
"epoch": 0.4509283819628647,
"grad_norm": 0.7072939560249456,
"learning_rate": 2.55919395465995e-05,
"loss": 0.5453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31181544065475464,
"step": 255,
"valid_targets_mean": 3208.2,
"valid_targets_min": 460
},
{
"epoch": 0.45977011494252873,
"grad_norm": 1.0523349102236121,
"learning_rate": 2.6095717884130986e-05,
"loss": 0.6377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4069092869758606,
"step": 260,
"valid_targets_mean": 3098.2,
"valid_targets_min": 411
},
{
"epoch": 0.46861184792219274,
"grad_norm": 0.6450257152535478,
"learning_rate": 2.659949622166247e-05,
"loss": 0.623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27830231189727783,
"step": 265,
"valid_targets_mean": 4357.8,
"valid_targets_min": 425
},
{
"epoch": 0.47745358090185674,
"grad_norm": 0.7522066599890925,
"learning_rate": 2.7103274559193958e-05,
"loss": 0.5872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18803122639656067,
"step": 270,
"valid_targets_mean": 2124.2,
"valid_targets_min": 409
},
{
"epoch": 0.48629531388152075,
"grad_norm": 0.884412534841973,
"learning_rate": 2.760705289672544e-05,
"loss": 0.616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3839704692363739,
"step": 275,
"valid_targets_mean": 2501.4,
"valid_targets_min": 368
},
{
"epoch": 0.4951370468611848,
"grad_norm": 0.8891118328744042,
"learning_rate": 2.811083123425693e-05,
"loss": 0.6361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3874850273132324,
"step": 280,
"valid_targets_mean": 2678.1,
"valid_targets_min": 1297
},
{
"epoch": 0.5039787798408488,
"grad_norm": 0.8262092882520712,
"learning_rate": 2.8614609571788415e-05,
"loss": 0.605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38311082124710083,
"step": 285,
"valid_targets_mean": 3422.0,
"valid_targets_min": 870
},
{
"epoch": 0.5128205128205128,
"grad_norm": 0.709275574520186,
"learning_rate": 2.91183879093199e-05,
"loss": 0.6046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18932947516441345,
"step": 290,
"valid_targets_mean": 2332.1,
"valid_targets_min": 718
},
{
"epoch": 0.5216622458001768,
"grad_norm": 0.7786332977338201,
"learning_rate": 2.9622166246851387e-05,
"loss": 0.6052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35691413283348083,
"step": 295,
"valid_targets_mean": 3540.5,
"valid_targets_min": 1245
},
{
"epoch": 0.5305039787798409,
"grad_norm": 0.7101179367848214,
"learning_rate": 3.0125944584382876e-05,
"loss": 0.6084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17877447605133057,
"step": 300,
"valid_targets_mean": 2138.0,
"valid_targets_min": 296
},
{
"epoch": 0.5393457117595049,
"grad_norm": 0.7234460485976838,
"learning_rate": 3.062972292191436e-05,
"loss": 0.5926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23484167456626892,
"step": 305,
"valid_targets_mean": 2718.2,
"valid_targets_min": 1374
},
{
"epoch": 0.5481874447391689,
"grad_norm": 0.8316290022850806,
"learning_rate": 3.113350125944585e-05,
"loss": 0.5576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605739235877991,
"step": 310,
"valid_targets_mean": 2342.1,
"valid_targets_min": 390
},
{
"epoch": 0.5570291777188329,
"grad_norm": 0.7443583580419373,
"learning_rate": 3.1637279596977334e-05,
"loss": 0.5824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3526822626590729,
"step": 315,
"valid_targets_mean": 2949.9,
"valid_targets_min": 378
},
{
"epoch": 0.5658709106984969,
"grad_norm": 0.9191837030143825,
"learning_rate": 3.214105793450882e-05,
"loss": 0.5984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35114723443984985,
"step": 320,
"valid_targets_mean": 2730.0,
"valid_targets_min": 479
},
{
"epoch": 0.5747126436781609,
"grad_norm": 0.7133394084017918,
"learning_rate": 3.2644836272040306e-05,
"loss": 0.5448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3304479122161865,
"step": 325,
"valid_targets_mean": 4008.5,
"valid_targets_min": 687
},
{
"epoch": 0.583554376657825,
"grad_norm": 0.7542186085539615,
"learning_rate": 3.314861460957179e-05,
"loss": 0.5912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35879507660865784,
"step": 330,
"valid_targets_mean": 3446.0,
"valid_targets_min": 1762
},
{
"epoch": 0.5923961096374889,
"grad_norm": 0.8806283364510236,
"learning_rate": 3.365239294710328e-05,
"loss": 0.546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2994898855686188,
"step": 335,
"valid_targets_mean": 2490.4,
"valid_targets_min": 1455
},
{
"epoch": 0.601237842617153,
"grad_norm": 0.7925231456510854,
"learning_rate": 3.415617128463476e-05,
"loss": 0.5375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27049198746681213,
"step": 340,
"valid_targets_mean": 3216.2,
"valid_targets_min": 1140
},
{
"epoch": 0.610079575596817,
"grad_norm": 0.8151714993878474,
"learning_rate": 3.465994962216625e-05,
"loss": 0.5658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3359305262565613,
"step": 345,
"valid_targets_mean": 2819.4,
"valid_targets_min": 420
},
{
"epoch": 0.618921308576481,
"grad_norm": 0.6987780960519617,
"learning_rate": 3.516372795969774e-05,
"loss": 0.5964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22273704409599304,
"step": 350,
"valid_targets_mean": 3495.1,
"valid_targets_min": 2035
},
{
"epoch": 0.627763041556145,
"grad_norm": 0.82782268216302,
"learning_rate": 3.566750629722922e-05,
"loss": 0.5694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.282134473323822,
"step": 355,
"valid_targets_mean": 2781.4,
"valid_targets_min": 836
},
{
"epoch": 0.636604774535809,
"grad_norm": 0.7171815954941675,
"learning_rate": 3.617128463476071e-05,
"loss": 0.542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24987182021141052,
"step": 360,
"valid_targets_mean": 2726.6,
"valid_targets_min": 650
},
{
"epoch": 0.6454465075154731,
"grad_norm": 0.6554762528349989,
"learning_rate": 3.667506297229219e-05,
"loss": 0.5764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21046540141105652,
"step": 365,
"valid_targets_mean": 2741.9,
"valid_targets_min": 647
},
{
"epoch": 0.654288240495137,
"grad_norm": 0.7169452163324568,
"learning_rate": 3.717884130982368e-05,
"loss": 0.5865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35952502489089966,
"step": 370,
"valid_targets_mean": 4276.4,
"valid_targets_min": 1909
},
{
"epoch": 0.6631299734748011,
"grad_norm": 0.7498682876453387,
"learning_rate": 3.7682619647355165e-05,
"loss": 0.6103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.398249089717865,
"step": 375,
"valid_targets_mean": 3914.2,
"valid_targets_min": 395
},
{
"epoch": 0.671971706454465,
"grad_norm": 0.7431702929941265,
"learning_rate": 3.8186397984886654e-05,
"loss": 0.5234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36680591106414795,
"step": 380,
"valid_targets_mean": 3600.5,
"valid_targets_min": 653
},
{
"epoch": 0.6808134394341291,
"grad_norm": 0.7032240193017438,
"learning_rate": 3.8690176322418137e-05,
"loss": 0.5644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25154560804367065,
"step": 385,
"valid_targets_mean": 3544.6,
"valid_targets_min": 514
},
{
"epoch": 0.6896551724137931,
"grad_norm": 0.7824728334071819,
"learning_rate": 3.9193954659949626e-05,
"loss": 0.587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2563400864601135,
"step": 390,
"valid_targets_mean": 2525.2,
"valid_targets_min": 417
},
{
"epoch": 0.6984969053934571,
"grad_norm": 0.5938754028594158,
"learning_rate": 3.969773299748111e-05,
"loss": 0.594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36213839054107666,
"step": 395,
"valid_targets_mean": 4965.6,
"valid_targets_min": 1573
},
{
"epoch": 0.7073386383731212,
"grad_norm": 0.8560713693271218,
"learning_rate": 3.999996893720319e-05,
"loss": 0.5368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28493037819862366,
"step": 400,
"valid_targets_mean": 2209.5,
"valid_targets_min": 482
},
{
"epoch": 0.7161803713527851,
"grad_norm": 0.6574999517551925,
"learning_rate": 3.999961948184714e-05,
"loss": 0.5683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27876657247543335,
"step": 405,
"valid_targets_mean": 4695.0,
"valid_targets_min": 739
},
{
"epoch": 0.7250221043324492,
"grad_norm": 0.7910350694289134,
"learning_rate": 3.999888174944605e-05,
"loss": 0.543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29521095752716064,
"step": 410,
"valid_targets_mean": 2854.2,
"valid_targets_min": 572
},
{
"epoch": 0.7338638373121131,
"grad_norm": 0.7327617592282828,
"learning_rate": 3.9997755754322415e-05,
"loss": 0.5316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23895704746246338,
"step": 415,
"valid_targets_mean": 3236.0,
"valid_targets_min": 1129
},
{
"epoch": 0.7427055702917772,
"grad_norm": 0.683762113730083,
"learning_rate": 3.9996241518336554e-05,
"loss": 0.5805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2622902989387512,
"step": 420,
"valid_targets_mean": 3360.2,
"valid_targets_min": 778
},
{
"epoch": 0.7515473032714411,
"grad_norm": 0.6712193589006633,
"learning_rate": 3.999433907088618e-05,
"loss": 0.5688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33563822507858276,
"step": 425,
"valid_targets_mean": 4434.6,
"valid_targets_min": 830
},
{
"epoch": 0.7603890362511052,
"grad_norm": 0.8978969987784136,
"learning_rate": 3.999204844890582e-05,
"loss": 0.5326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21699407696723938,
"step": 430,
"valid_targets_mean": 1812.0,
"valid_targets_min": 380
},
{
"epoch": 0.7692307692307693,
"grad_norm": 0.7936562082241674,
"learning_rate": 3.998936969686614e-05,
"loss": 0.565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2873769700527191,
"step": 435,
"valid_targets_mean": 2613.8,
"valid_targets_min": 351
},
{
"epoch": 0.7780725022104332,
"grad_norm": 0.6494725254339784,
"learning_rate": 3.9986302866773e-05,
"loss": 0.561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27636170387268066,
"step": 440,
"valid_targets_mean": 3525.8,
"valid_targets_min": 515
},
{
"epoch": 0.7869142351900973,
"grad_norm": 0.7239196043024896,
"learning_rate": 3.998284801816654e-05,
"loss": 0.5455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27213937044143677,
"step": 445,
"valid_targets_mean": 2831.9,
"valid_targets_min": 445
},
{
"epoch": 0.7957559681697612,
"grad_norm": 0.6995801380039492,
"learning_rate": 3.997900521811995e-05,
"loss": 0.5635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28841322660446167,
"step": 450,
"valid_targets_mean": 2727.2,
"valid_targets_min": 663
},
{
"epoch": 0.8045977011494253,
"grad_norm": 0.7321413221468167,
"learning_rate": 3.997477454123818e-05,
"loss": 0.5781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2708323299884796,
"step": 455,
"valid_targets_mean": 3125.6,
"valid_targets_min": 1084
},
{
"epoch": 0.8134394341290893,
"grad_norm": 0.834232877873331,
"learning_rate": 3.997015606965656e-05,
"loss": 0.5392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3525821566581726,
"step": 460,
"valid_targets_mean": 2664.1,
"valid_targets_min": 1235
},
{
"epoch": 0.8222811671087533,
"grad_norm": 0.8321360896222851,
"learning_rate": 3.996514989303911e-05,
"loss": 0.6028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32734864950180054,
"step": 465,
"valid_targets_mean": 2494.2,
"valid_targets_min": 1261
},
{
"epoch": 0.8311229000884174,
"grad_norm": 0.6935337345612683,
"learning_rate": 3.9959756108576853e-05,
"loss": 0.5558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24893325567245483,
"step": 470,
"valid_targets_mean": 2565.8,
"valid_targets_min": 1449
},
{
"epoch": 0.8399646330680813,
"grad_norm": 0.8571991620574829,
"learning_rate": 3.995397482098591e-05,
"loss": 0.5884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36881160736083984,
"step": 475,
"valid_targets_mean": 2929.9,
"valid_targets_min": 412
},
{
"epoch": 0.8488063660477454,
"grad_norm": 0.7459479118876244,
"learning_rate": 3.994780614250548e-05,
"loss": 0.5396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3047880232334137,
"step": 480,
"valid_targets_mean": 3779.6,
"valid_targets_min": 2634
},
{
"epoch": 0.8576480990274093,
"grad_norm": 0.7142768197579014,
"learning_rate": 3.994125019289566e-05,
"loss": 0.5359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2945425808429718,
"step": 485,
"valid_targets_mean": 3228.9,
"valid_targets_min": 708
},
{
"epoch": 0.8664898320070734,
"grad_norm": 0.6309840561705765,
"learning_rate": 3.99343070994351e-05,
"loss": 0.5466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2996477782726288,
"step": 490,
"valid_targets_mean": 4352.0,
"valid_targets_min": 784
},
{
"epoch": 0.8753315649867374,
"grad_norm": 0.72422812308097,
"learning_rate": 3.992697699691857e-05,
"loss": 0.5754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3740094304084778,
"step": 495,
"valid_targets_mean": 3836.0,
"valid_targets_min": 1609
},
{
"epoch": 0.8841732979664014,
"grad_norm": 0.8938896424491545,
"learning_rate": 3.9919260027654304e-05,
"loss": 0.612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3498684763908386,
"step": 500,
"valid_targets_mean": 2197.9,
"valid_targets_min": 1020
},
{
"epoch": 0.8930150309460654,
"grad_norm": 0.6203004592548081,
"learning_rate": 3.991115634146123e-05,
"loss": 0.5209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26198410987854004,
"step": 505,
"valid_targets_mean": 3834.1,
"valid_targets_min": 1492
},
{
"epoch": 0.9018567639257294,
"grad_norm": 0.8296110311313931,
"learning_rate": 3.990266609566614e-05,
"loss": 0.5822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23738741874694824,
"step": 510,
"valid_targets_mean": 1985.0,
"valid_targets_min": 412
},
{
"epoch": 0.9106984969053935,
"grad_norm": 0.6830643774979811,
"learning_rate": 3.9893789455100514e-05,
"loss": 0.5182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2690092921257019,
"step": 515,
"valid_targets_mean": 3141.5,
"valid_targets_min": 1099
},
{
"epoch": 0.9195402298850575,
"grad_norm": 0.6736971639546346,
"learning_rate": 3.988452659209745e-05,
"loss": 0.5723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22991755604743958,
"step": 520,
"valid_targets_mean": 2799.1,
"valid_targets_min": 829
},
{
"epoch": 0.9283819628647215,
"grad_norm": 0.7173030371663041,
"learning_rate": 3.9874877686488197e-05,
"loss": 0.5628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34016090631484985,
"step": 525,
"valid_targets_mean": 3242.2,
"valid_targets_min": 1744
},
{
"epoch": 0.9372236958443855,
"grad_norm": 0.7040214824132874,
"learning_rate": 3.986484292559877e-05,
"loss": 0.5405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2545274496078491,
"step": 530,
"valid_targets_mean": 3138.1,
"valid_targets_min": 1853
},
{
"epoch": 0.9460654288240495,
"grad_norm": 0.8218611125304961,
"learning_rate": 3.9854422504246224e-05,
"loss": 0.5626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32547083497047424,
"step": 535,
"valid_targets_mean": 2763.6,
"valid_targets_min": 501
},
{
"epoch": 0.9549071618037135,
"grad_norm": 0.6214205266111335,
"learning_rate": 3.984361662473494e-05,
"loss": 0.5616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16753855347633362,
"step": 540,
"valid_targets_mean": 2641.5,
"valid_targets_min": 1835
},
{
"epoch": 0.9637488947833776,
"grad_norm": 0.5778657679333664,
"learning_rate": 3.9832425496852644e-05,
"loss": 0.5737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28100019693374634,
"step": 545,
"valid_targets_mean": 4093.9,
"valid_targets_min": 566
},
{
"epoch": 0.9725906277630415,
"grad_norm": 0.7198881631279556,
"learning_rate": 3.982084933786639e-05,
"loss": 0.5622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2683573067188263,
"step": 550,
"valid_targets_mean": 3153.2,
"valid_targets_min": 460
},
{
"epoch": 0.9814323607427056,
"grad_norm": 0.7294048125531857,
"learning_rate": 3.9808888372518285e-05,
"loss": 0.523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22038066387176514,
"step": 555,
"valid_targets_mean": 2419.9,
"valid_targets_min": 281
},
{
"epoch": 0.9902740937223696,
"grad_norm": 0.7554402239187559,
"learning_rate": 3.979654283302115e-05,
"loss": 0.561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33254435658454895,
"step": 560,
"valid_targets_mean": 3315.4,
"valid_targets_min": 1551
},
{
"epoch": 0.9991158267020336,
"grad_norm": 0.9531782119454033,
"learning_rate": 3.9783812959054054e-05,
"loss": 0.54,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2633528709411621,
"step": 565,
"valid_targets_mean": 2802.5,
"valid_targets_min": 1365
},
{
"epoch": 1.0070733863837311,
"grad_norm": 0.7219142907133131,
"learning_rate": 3.9770698997757564e-05,
"loss": 0.5341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.360717236995697,
"step": 570,
"valid_targets_mean": 3532.2,
"valid_targets_min": 1467
},
{
"epoch": 1.0159151193633953,
"grad_norm": 0.6832964222244942,
"learning_rate": 3.975720120372905e-05,
"loss": 0.5604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3534933924674988,
"step": 575,
"valid_targets_mean": 4285.2,
"valid_targets_min": 473
},
{
"epoch": 1.0247568523430592,
"grad_norm": 0.7104879022906077,
"learning_rate": 3.974331983901766e-05,
"loss": 0.5139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23602774739265442,
"step": 580,
"valid_targets_mean": 3051.0,
"valid_targets_min": 769
},
{
"epoch": 1.0335985853227232,
"grad_norm": 1.0289475556516747,
"learning_rate": 3.972905517311929e-05,
"loss": 0.5025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2523854076862335,
"step": 585,
"valid_targets_mean": 4518.4,
"valid_targets_min": 1272
},
{
"epoch": 1.0424403183023874,
"grad_norm": 0.6070195547061199,
"learning_rate": 3.9714407482971335e-05,
"loss": 0.503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1908818781375885,
"step": 590,
"valid_targets_mean": 3155.4,
"valid_targets_min": 1502
},
{
"epoch": 1.0512820512820513,
"grad_norm": 0.8043171275547331,
"learning_rate": 3.969937705294728e-05,
"loss": 0.5078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33768388628959656,
"step": 595,
"valid_targets_mean": 3010.2,
"valid_targets_min": 1505
},
{
"epoch": 1.0601237842617153,
"grad_norm": 0.7749567786956729,
"learning_rate": 3.968396417485125e-05,
"loss": 0.5508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2937096357345581,
"step": 600,
"valid_targets_mean": 2740.4,
"valid_targets_min": 401
},
{
"epoch": 1.0689655172413792,
"grad_norm": 0.6956637921840406,
"learning_rate": 3.966816914791226e-05,
"loss": 0.5343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3460909426212311,
"step": 605,
"valid_targets_mean": 4797.0,
"valid_targets_min": 1353
},
{
"epoch": 1.0778072502210434,
"grad_norm": 0.8116625470978949,
"learning_rate": 3.965199227877846e-05,
"loss": 0.5254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32285335659980774,
"step": 610,
"valid_targets_mean": 2429.6,
"valid_targets_min": 438
},
{
"epoch": 1.0866489832007074,
"grad_norm": 0.7159169923970375,
"learning_rate": 3.963543388151117e-05,
"loss": 0.5176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2541963458061218,
"step": 615,
"valid_targets_mean": 4086.0,
"valid_targets_min": 702
},
{
"epoch": 1.0954907161803713,
"grad_norm": 0.851138769147014,
"learning_rate": 3.9618494277578806e-05,
"loss": 0.5254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1655346155166626,
"step": 620,
"valid_targets_mean": 1852.5,
"valid_targets_min": 330
},
{
"epoch": 1.1043324491600353,
"grad_norm": 0.7278081843736119,
"learning_rate": 3.960117379585057e-05,
"loss": 0.56,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3517983555793762,
"step": 625,
"valid_targets_mean": 4008.0,
"valid_targets_min": 1452
},
{
"epoch": 1.1131741821396994,
"grad_norm": 0.719616659459927,
"learning_rate": 3.958347277259015e-05,
"loss": 0.4971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31380581855773926,
"step": 630,
"valid_targets_mean": 3580.6,
"valid_targets_min": 309
},
{
"epoch": 1.1220159151193634,
"grad_norm": 0.63160465301193,
"learning_rate": 3.956539155144912e-05,
"loss": 0.5234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2329138219356537,
"step": 635,
"valid_targets_mean": 4057.8,
"valid_targets_min": 1396
},
{
"epoch": 1.1308576480990273,
"grad_norm": 0.6825427065012454,
"learning_rate": 3.9546930483460326e-05,
"loss": 0.516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27975958585739136,
"step": 640,
"valid_targets_mean": 3343.4,
"valid_targets_min": 1645
},
{
"epoch": 1.1396993810786915,
"grad_norm": 0.699265105549181,
"learning_rate": 3.952808992703102e-05,
"loss": 0.5083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23706836998462677,
"step": 645,
"valid_targets_mean": 2710.6,
"valid_targets_min": 507
},
{
"epoch": 1.1485411140583555,
"grad_norm": 0.8045984010228572,
"learning_rate": 3.9508870247935964e-05,
"loss": 0.5351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1919955015182495,
"step": 650,
"valid_targets_mean": 1751.8,
"valid_targets_min": 284
},
{
"epoch": 1.1573828470380194,
"grad_norm": 0.6012250412087359,
"learning_rate": 3.948927181931024e-05,
"loss": 0.52,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.263777494430542,
"step": 655,
"valid_targets_mean": 4245.5,
"valid_targets_min": 854
},
{
"epoch": 1.1662245800176834,
"grad_norm": 0.5992821189180728,
"learning_rate": 3.94692950216421e-05,
"loss": 0.5235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23570390045642853,
"step": 660,
"valid_targets_mean": 3959.2,
"valid_targets_min": 276
},
{
"epoch": 1.1750663129973475,
"grad_norm": 0.610845100602426,
"learning_rate": 3.944894024276552e-05,
"loss": 0.5026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1973716914653778,
"step": 665,
"valid_targets_mean": 3387.4,
"valid_targets_min": 675
},
{
"epoch": 1.1839080459770115,
"grad_norm": 0.7207065986679495,
"learning_rate": 3.9428207877852684e-05,
"loss": 0.5115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17878985404968262,
"step": 670,
"valid_targets_mean": 2142.6,
"valid_targets_min": 384
},
{
"epoch": 1.1927497789566754,
"grad_norm": 0.7934727448753174,
"learning_rate": 3.940709832940632e-05,
"loss": 0.5465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2502514123916626,
"step": 675,
"valid_targets_mean": 2718.2,
"valid_targets_min": 1759
},
{
"epoch": 1.2015915119363396,
"grad_norm": 0.7998141403870273,
"learning_rate": 3.938561200725189e-05,
"loss": 0.513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2249201387166977,
"step": 680,
"valid_targets_mean": 2136.0,
"valid_targets_min": 315
},
{
"epoch": 1.2104332449160036,
"grad_norm": 0.6227661283561698,
"learning_rate": 3.9363749328529594e-05,
"loss": 0.5482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.259385883808136,
"step": 685,
"valid_targets_mean": 3826.6,
"valid_targets_min": 1730
},
{
"epoch": 1.2192749778956675,
"grad_norm": 0.6206992015741707,
"learning_rate": 3.934151071768634e-05,
"loss": 0.5537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2900537848472595,
"step": 690,
"valid_targets_mean": 4350.5,
"valid_targets_min": 595
},
{
"epoch": 1.2281167108753315,
"grad_norm": 0.5635939679566414,
"learning_rate": 3.931889660646744e-05,
"loss": 0.5482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2819467782974243,
"step": 695,
"valid_targets_mean": 4096.9,
"valid_targets_min": 1070
},
{
"epoch": 1.2369584438549956,
"grad_norm": 0.6692534359398423,
"learning_rate": 3.9295907433908264e-05,
"loss": 0.5415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2925758361816406,
"step": 700,
"valid_targets_mean": 4126.9,
"valid_targets_min": 1240
},
{
"epoch": 1.2458001768346596,
"grad_norm": 0.7190209534372782,
"learning_rate": 3.9272543646325703e-05,
"loss": 0.5317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19594435393810272,
"step": 705,
"valid_targets_mean": 2114.2,
"valid_targets_min": 1022
},
{
"epoch": 1.2546419098143236,
"grad_norm": 0.7405430028094008,
"learning_rate": 3.924880569730951e-05,
"loss": 0.5281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31587642431259155,
"step": 710,
"valid_targets_mean": 3316.2,
"valid_targets_min": 1055
},
{
"epoch": 1.2634836427939877,
"grad_norm": 0.7318705208252564,
"learning_rate": 3.9224694047713475e-05,
"loss": 0.51,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1906820833683014,
"step": 715,
"valid_targets_mean": 2082.6,
"valid_targets_min": 350
},
{
"epoch": 1.2723253757736517,
"grad_norm": 0.6136614929326403,
"learning_rate": 3.920020916564652e-05,
"loss": 0.504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2813029885292053,
"step": 720,
"valid_targets_mean": 3609.0,
"valid_targets_min": 1686
},
{
"epoch": 1.2811671087533156,
"grad_norm": 0.7619702273083326,
"learning_rate": 3.917535152646356e-05,
"loss": 0.57,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29840072989463806,
"step": 725,
"valid_targets_mean": 3075.8,
"valid_targets_min": 350
},
{
"epoch": 1.2900088417329796,
"grad_norm": 0.6340553976724329,
"learning_rate": 3.915012161275633e-05,
"loss": 0.5579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35292381048202515,
"step": 730,
"valid_targets_mean": 4762.0,
"valid_targets_min": 576
},
{
"epoch": 1.2988505747126438,
"grad_norm": 0.6314054240931711,
"learning_rate": 3.912451991434395e-05,
"loss": 0.5253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2579632103443146,
"step": 735,
"valid_targets_mean": 3673.4,
"valid_targets_min": 591
},
{
"epoch": 1.3076923076923077,
"grad_norm": 0.5775959962805894,
"learning_rate": 3.909854692826348e-05,
"loss": 0.5043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20548564195632935,
"step": 740,
"valid_targets_mean": 3846.4,
"valid_targets_min": 1071
},
{
"epoch": 1.3165340406719717,
"grad_norm": 0.655758917865089,
"learning_rate": 3.9072203158760215e-05,
"loss": 0.5015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2677724361419678,
"step": 745,
"valid_targets_mean": 3850.2,
"valid_targets_min": 515
},
{
"epoch": 1.3253757736516358,
"grad_norm": 0.8148294806624113,
"learning_rate": 3.904548911727793e-05,
"loss": 0.5228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3152320384979248,
"step": 750,
"valid_targets_mean": 3107.8,
"valid_targets_min": 812
},
{
"epoch": 1.3342175066312998,
"grad_norm": 0.8146168712526004,
"learning_rate": 3.901840532244897e-05,
"loss": 0.4892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3347662687301636,
"step": 755,
"valid_targets_mean": 3066.6,
"valid_targets_min": 372
},
{
"epoch": 1.3430592396109637,
"grad_norm": 0.7139126711376225,
"learning_rate": 3.899095230008411e-05,
"loss": 0.4955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2709360718727112,
"step": 760,
"valid_targets_mean": 3221.8,
"valid_targets_min": 275
},
{
"epoch": 1.3519009725906277,
"grad_norm": 0.7341120923859575,
"learning_rate": 3.896313058316242e-05,
"loss": 0.5131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2554779648780823,
"step": 765,
"valid_targets_mean": 3690.6,
"valid_targets_min": 864
},
{
"epoch": 1.3607427055702916,
"grad_norm": 0.7351206776886251,
"learning_rate": 3.8934940711820876e-05,
"loss": 0.5282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2886347770690918,
"step": 770,
"valid_targets_mean": 3220.2,
"valid_targets_min": 1394
},
{
"epoch": 1.3695844385499558,
"grad_norm": 0.6815412632856188,
"learning_rate": 3.8906383233343886e-05,
"loss": 0.5301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2817658483982086,
"step": 775,
"valid_targets_mean": 3736.1,
"valid_targets_min": 1035
},
{
"epoch": 1.3784261715296198,
"grad_norm": 0.6083778824304598,
"learning_rate": 3.887745870215268e-05,
"loss": 0.5448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20323900878429413,
"step": 780,
"valid_targets_mean": 3170.0,
"valid_targets_min": 260
},
{
"epoch": 1.387267904509284,
"grad_norm": 0.701861952740278,
"learning_rate": 3.884816767979449e-05,
"loss": 0.5251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28836336731910706,
"step": 785,
"valid_targets_mean": 3401.8,
"valid_targets_min": 1408
},
{
"epoch": 1.396109637488948,
"grad_norm": 0.6895304322708055,
"learning_rate": 3.881851073493174e-05,
"loss": 0.5549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2803962528705597,
"step": 790,
"valid_targets_mean": 3533.6,
"valid_targets_min": 518
},
{
"epoch": 1.4049513704686118,
"grad_norm": 0.8606543782305618,
"learning_rate": 3.878848844333091e-05,
"loss": 0.4985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2970787286758423,
"step": 795,
"valid_targets_mean": 3216.2,
"valid_targets_min": 1616
},
{
"epoch": 1.4137931034482758,
"grad_norm": 0.748948338513349,
"learning_rate": 3.875810138785144e-05,
"loss": 0.517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20471307635307312,
"step": 800,
"valid_targets_mean": 2873.0,
"valid_targets_min": 1791
},
{
"epoch": 1.4226348364279398,
"grad_norm": 0.6282655364858861,
"learning_rate": 3.872735015843435e-05,
"loss": 0.5369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2569165825843811,
"step": 805,
"valid_targets_mean": 4159.0,
"valid_targets_min": 2118
},
{
"epoch": 1.431476569407604,
"grad_norm": 0.6800159245193907,
"learning_rate": 3.8696235352090827e-05,
"loss": 0.4849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21237662434577942,
"step": 810,
"valid_targets_mean": 2913.5,
"valid_targets_min": 1511
},
{
"epoch": 1.4403183023872679,
"grad_norm": 0.7491849980098594,
"learning_rate": 3.8664757572890624e-05,
"loss": 0.5431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31936168670654297,
"step": 815,
"valid_targets_mean": 3183.8,
"valid_targets_min": 443
},
{
"epoch": 1.449160035366932,
"grad_norm": 0.6726532976813931,
"learning_rate": 3.863291743195031e-05,
"loss": 0.5368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3247930407524109,
"step": 820,
"valid_targets_mean": 5290.1,
"valid_targets_min": 1596
},
{
"epoch": 1.458001768346596,
"grad_norm": 0.6414216904520894,
"learning_rate": 3.860071554742144e-05,
"loss": 0.5517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23261283338069916,
"step": 825,
"valid_targets_mean": 2761.5,
"valid_targets_min": 544
},
{
"epoch": 1.46684350132626,
"grad_norm": 0.6133136558161559,
"learning_rate": 3.856815254447854e-05,
"loss": 0.538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27468377351760864,
"step": 830,
"valid_targets_mean": 4492.1,
"valid_targets_min": 1240
},
{
"epoch": 1.475685234305924,
"grad_norm": 0.6535282175604957,
"learning_rate": 3.853522905530698e-05,
"loss": 0.4972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28734225034713745,
"step": 835,
"valid_targets_mean": 4208.9,
"valid_targets_min": 1370
},
{
"epoch": 1.4845269672855879,
"grad_norm": 0.7163769356371759,
"learning_rate": 3.850194571909065e-05,
"loss": 0.5515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21620656549930573,
"step": 840,
"valid_targets_mean": 2672.6,
"valid_targets_min": 530
},
{
"epoch": 1.493368700265252,
"grad_norm": 0.6339266507899239,
"learning_rate": 3.8468303181999625e-05,
"loss": 0.5241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22579747438430786,
"step": 845,
"valid_targets_mean": 3050.4,
"valid_targets_min": 1845
},
{
"epoch": 1.502210433244916,
"grad_norm": 0.6670589515749927,
"learning_rate": 3.843430209717758e-05,
"loss": 0.501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25417882204055786,
"step": 850,
"valid_targets_mean": 2978.0,
"valid_targets_min": 1018
},
{
"epoch": 1.5110521662245802,
"grad_norm": 0.6632769562515543,
"learning_rate": 3.839994312472911e-05,
"loss": 0.5055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.244868203997612,
"step": 855,
"valid_targets_mean": 3159.6,
"valid_targets_min": 395
},
{
"epoch": 1.5198938992042441,
"grad_norm": 0.7476673252142214,
"learning_rate": 3.836522693170692e-05,
"loss": 0.5333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.322563499212265,
"step": 860,
"valid_targets_mean": 3074.9,
"valid_targets_min": 1925
},
{
"epoch": 1.528735632183908,
"grad_norm": 1.182699133656073,
"learning_rate": 3.833015419209888e-05,
"loss": 0.5195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.233692467212677,
"step": 865,
"valid_targets_mean": 2652.8,
"valid_targets_min": 505
},
{
"epoch": 1.537577365163572,
"grad_norm": 0.5963050788873372,
"learning_rate": 3.8294725586814925e-05,
"loss": 0.5379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31656789779663086,
"step": 870,
"valid_targets_mean": 4504.1,
"valid_targets_min": 279
},
{
"epoch": 1.546419098143236,
"grad_norm": 0.7076807714391373,
"learning_rate": 3.8258941803673845e-05,
"loss": 0.4895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21023747324943542,
"step": 875,
"valid_targets_mean": 2384.8,
"valid_targets_min": 663
},
{
"epoch": 1.5552608311229,
"grad_norm": 0.7242194753984217,
"learning_rate": 3.822280353738995e-05,
"loss": 0.5278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15555477142333984,
"step": 880,
"valid_targets_mean": 1807.2,
"valid_targets_min": 367
},
{
"epoch": 1.564102564102564,
"grad_norm": 0.680725926895947,
"learning_rate": 3.818631148955954e-05,
"loss": 0.5183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23022373020648956,
"step": 885,
"valid_targets_mean": 3061.0,
"valid_targets_min": 472
},
{
"epoch": 1.5729442970822283,
"grad_norm": 0.6589551518144537,
"learning_rate": 3.814946636864732e-05,
"loss": 0.5016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3253025710582733,
"step": 890,
"valid_targets_mean": 4214.9,
"valid_targets_min": 464
},
{
"epoch": 1.5817860300618922,
"grad_norm": 0.695071470979805,
"learning_rate": 3.8112268889972635e-05,
"loss": 0.5002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27869266271591187,
"step": 895,
"valid_targets_mean": 3458.9,
"valid_targets_min": 541
},
{
"epoch": 1.5906277630415562,
"grad_norm": 0.6394253917274505,
"learning_rate": 3.807471977569558e-05,
"loss": 0.5247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28981101512908936,
"step": 900,
"valid_targets_mean": 3587.0,
"valid_targets_min": 714
},
{
"epoch": 1.5994694960212201,
"grad_norm": 0.6407279388785145,
"learning_rate": 3.803681975480298e-05,
"loss": 0.5339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30930954217910767,
"step": 905,
"valid_targets_mean": 4241.2,
"valid_targets_min": 1531
},
{
"epoch": 1.608311229000884,
"grad_norm": 0.6262370337590383,
"learning_rate": 3.799856956309424e-05,
"loss": 0.5043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15924446284770966,
"step": 910,
"valid_targets_mean": 2515.5,
"valid_targets_min": 251
},
{
"epoch": 1.617152961980548,
"grad_norm": 0.5799667981131503,
"learning_rate": 3.7959969943167064e-05,
"loss": 0.4945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2013358175754547,
"step": 915,
"valid_targets_mean": 3255.0,
"valid_targets_min": 888
},
{
"epoch": 1.6259946949602122,
"grad_norm": 0.7839747219704393,
"learning_rate": 3.7921021644403024e-05,
"loss": 0.513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39778536558151245,
"step": 920,
"valid_targets_mean": 3479.8,
"valid_targets_min": 1418
},
{
"epoch": 1.6348364279398764,
"grad_norm": 1.0927382964698964,
"learning_rate": 3.788172542295303e-05,
"loss": 0.4882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3143307566642761,
"step": 925,
"valid_targets_mean": 3410.4,
"valid_targets_min": 680
},
{
"epoch": 1.6436781609195403,
"grad_norm": 0.71590844445193,
"learning_rate": 3.784208204172262e-05,
"loss": 0.4901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3356863856315613,
"step": 930,
"valid_targets_mean": 3325.4,
"valid_targets_min": 1757
},
{
"epoch": 1.6525198938992043,
"grad_norm": 0.6973512644137526,
"learning_rate": 3.7802092270357196e-05,
"loss": 0.5329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.272472620010376,
"step": 935,
"valid_targets_mean": 2601.2,
"valid_targets_min": 260
},
{
"epoch": 1.6613616268788682,
"grad_norm": 0.6008785059006879,
"learning_rate": 3.7761756885227046e-05,
"loss": 0.491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2572758197784424,
"step": 940,
"valid_targets_mean": 4301.5,
"valid_targets_min": 2006
},
{
"epoch": 1.6702033598585322,
"grad_norm": 0.5744209498415186,
"learning_rate": 3.772107666941226e-05,
"loss": 0.5167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26439422369003296,
"step": 945,
"valid_targets_mean": 4495.4,
"valid_targets_min": 2496
},
{
"epoch": 1.6790450928381961,
"grad_norm": 0.6465740308526822,
"learning_rate": 3.768005241268757e-05,
"loss": 0.5639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25202465057373047,
"step": 950,
"valid_targets_mean": 3123.2,
"valid_targets_min": 939
},
{
"epoch": 1.6878868258178603,
"grad_norm": 0.7051342522734189,
"learning_rate": 3.7638684911506993e-05,
"loss": 0.5478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1941746175289154,
"step": 955,
"valid_targets_mean": 2783.6,
"valid_targets_min": 466
},
{
"epoch": 1.6967285587975243,
"grad_norm": 0.6946362639039605,
"learning_rate": 3.7596974968988366e-05,
"loss": 0.4773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2674318552017212,
"step": 960,
"valid_targets_mean": 2750.2,
"valid_targets_min": 520
},
{
"epoch": 1.7055702917771884,
"grad_norm": 0.6323893584576677,
"learning_rate": 3.755492339489775e-05,
"loss": 0.5122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2906394600868225,
"step": 965,
"valid_targets_mean": 4283.9,
"valid_targets_min": 1633
},
{
"epoch": 1.7144120247568524,
"grad_norm": 0.7054390689371448,
"learning_rate": 3.751253100563373e-05,
"loss": 0.4883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21445819735527039,
"step": 970,
"valid_targets_mean": 2264.2,
"valid_targets_min": 451
},
{
"epoch": 1.7232537577365163,
"grad_norm": 0.7148446633987146,
"learning_rate": 3.746979862421154e-05,
"loss": 0.492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3135313391685486,
"step": 975,
"valid_targets_mean": 4694.2,
"valid_targets_min": 1787
},
{
"epoch": 1.7320954907161803,
"grad_norm": 0.7119677167199814,
"learning_rate": 3.742672708024711e-05,
"loss": 0.5171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30675750970840454,
"step": 980,
"valid_targets_mean": 2838.9,
"valid_targets_min": 482
},
{
"epoch": 1.7409372236958442,
"grad_norm": 0.6482828478440643,
"learning_rate": 3.7383317209940936e-05,
"loss": 0.5151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1551651656627655,
"step": 985,
"valid_targets_mean": 1954.4,
"valid_targets_min": 246
},
{
"epoch": 1.7497789566755084,
"grad_norm": 0.7314955066133645,
"learning_rate": 3.7339569856061864e-05,
"loss": 0.5084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22127586603164673,
"step": 990,
"valid_targets_mean": 2476.5,
"valid_targets_min": 826
},
{
"epoch": 1.7586206896551724,
"grad_norm": 1.098815890414233,
"learning_rate": 3.7295485867930715e-05,
"loss": 0.509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23905551433563232,
"step": 995,
"valid_targets_mean": 2440.1,
"valid_targets_min": 321
},
{
"epoch": 1.7674624226348365,
"grad_norm": 0.6764041908437947,
"learning_rate": 3.72510661014038e-05,
"loss": 0.5291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24814735352993011,
"step": 1000,
"valid_targets_mean": 3079.6,
"valid_targets_min": 1683
},
{
"epoch": 1.7763041556145005,
"grad_norm": 0.5186517018593776,
"learning_rate": 3.720631141885633e-05,
"loss": 0.5058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20242926478385925,
"step": 1005,
"valid_targets_mean": 4913.6,
"valid_targets_min": 628
},
{
"epoch": 1.7851458885941645,
"grad_norm": 0.7772370190529831,
"learning_rate": 3.716122268916561e-05,
"loss": 0.4809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2603060007095337,
"step": 1010,
"valid_targets_mean": 3256.9,
"valid_targets_min": 686
},
{
"epoch": 1.7939876215738284,
"grad_norm": 0.5469582973910361,
"learning_rate": 3.711580078769424e-05,
"loss": 0.5089,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27079907059669495,
"step": 1015,
"valid_targets_mean": 4628.6,
"valid_targets_min": 920
},
{
"epoch": 1.8028293545534924,
"grad_norm": 0.6974198275003209,
"learning_rate": 3.707004659627308e-05,
"loss": 0.4978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31995758414268494,
"step": 1020,
"valid_targets_mean": 3138.6,
"valid_targets_min": 636
},
{
"epoch": 1.8116710875331565,
"grad_norm": 0.6920590455597191,
"learning_rate": 3.702396100318414e-05,
"loss": 0.5847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28330913186073303,
"step": 1025,
"valid_targets_mean": 3097.5,
"valid_targets_min": 1473
},
{
"epoch": 1.8205128205128205,
"grad_norm": 0.7496027840560946,
"learning_rate": 3.697754490314335e-05,
"loss": 0.5644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2400278002023697,
"step": 1030,
"valid_targets_mean": 2275.6,
"valid_targets_min": 719
},
{
"epoch": 1.8293545534924847,
"grad_norm": 0.6856958367471065,
"learning_rate": 3.693079919728314e-05,
"loss": 0.4957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2846917510032654,
"step": 1035,
"valid_targets_mean": 3595.0,
"valid_targets_min": 683
},
{
"epoch": 1.8381962864721486,
"grad_norm": 0.5935125821966083,
"learning_rate": 3.688372479313503e-05,
"loss": 0.5339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36108407378196716,
"step": 1040,
"valid_targets_mean": 4035.4,
"valid_targets_min": 1791
},
{
"epoch": 1.8470380194518126,
"grad_norm": 0.7416423484223358,
"learning_rate": 3.683632260461191e-05,
"loss": 0.5628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22433266043663025,
"step": 1045,
"valid_targets_mean": 3904.5,
"valid_targets_min": 1328
},
{
"epoch": 1.8558797524314765,
"grad_norm": 0.6245382430385877,
"learning_rate": 3.6788593551990395e-05,
"loss": 0.4787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25612908601760864,
"step": 1050,
"valid_targets_mean": 3262.2,
"valid_targets_min": 666
},
{
"epoch": 1.8647214854111405,
"grad_norm": 0.6171431811555288,
"learning_rate": 3.674053856189289e-05,
"loss": 0.5058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35327455401420593,
"step": 1055,
"valid_targets_mean": 4502.4,
"valid_targets_min": 2273
},
{
"epoch": 1.8735632183908046,
"grad_norm": 0.6939023212762249,
"learning_rate": 3.66921585672696e-05,
"loss": 0.5145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15852488577365875,
"step": 1060,
"valid_targets_mean": 1888.6,
"valid_targets_min": 239
},
{
"epoch": 1.8824049513704686,
"grad_norm": 0.7982037605123552,
"learning_rate": 3.664345450738048e-05,
"loss": 0.4853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16701588034629822,
"step": 1065,
"valid_targets_mean": 1619.1,
"valid_targets_min": 339
},
{
"epoch": 1.8912466843501328,
"grad_norm": 0.608658314659487,
"learning_rate": 3.659442732777694e-05,
"loss": 0.5163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3004249930381775,
"step": 1070,
"valid_targets_mean": 5308.4,
"valid_targets_min": 646
},
{
"epoch": 1.9000884173297967,
"grad_norm": 0.7906418390790385,
"learning_rate": 3.6545077980283516e-05,
"loss": 0.5004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33155688643455505,
"step": 1075,
"valid_targets_mean": 2850.4,
"valid_targets_min": 758
},
{
"epoch": 1.9089301503094607,
"grad_norm": 0.7032647160707013,
"learning_rate": 3.649540742297937e-05,
"loss": 0.5095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2129090428352356,
"step": 1080,
"valid_targets_mean": 2458.6,
"valid_targets_min": 621
},
{
"epoch": 1.9177718832891246,
"grad_norm": 0.6238133398192949,
"learning_rate": 3.6445416620179715e-05,
"loss": 0.4988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.209529310464859,
"step": 1085,
"valid_targets_mean": 3219.8,
"valid_targets_min": 1912
},
{
"epoch": 1.9266136162687886,
"grad_norm": 0.7568137310829532,
"learning_rate": 3.6395106542417066e-05,
"loss": 0.5155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3271511495113373,
"step": 1090,
"valid_targets_mean": 2758.9,
"valid_targets_min": 1274
},
{
"epoch": 1.9354553492484527,
"grad_norm": 0.6192848137574003,
"learning_rate": 3.6344478166422435e-05,
"loss": 0.4981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642071545124054,
"step": 1095,
"valid_targets_mean": 3695.9,
"valid_targets_min": 1417
},
{
"epoch": 1.9442970822281167,
"grad_norm": 0.7309050802016251,
"learning_rate": 3.6293532475106325e-05,
"loss": 0.482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29965919256210327,
"step": 1100,
"valid_targets_mean": 2750.0,
"valid_targets_min": 454
},
{
"epoch": 1.9531388152077809,
"grad_norm": 1.0623788457569725,
"learning_rate": 3.6242270457539695e-05,
"loss": 0.5106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2692793607711792,
"step": 1105,
"valid_targets_mean": 2734.0,
"valid_targets_min": 1420
},
{
"epoch": 1.9619805481874448,
"grad_norm": 0.7151768641889232,
"learning_rate": 3.6190693108934685e-05,
"loss": 0.4966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22051319479942322,
"step": 1110,
"valid_targets_mean": 2504.2,
"valid_targets_min": 515
},
{
"epoch": 1.9708222811671088,
"grad_norm": 0.6957676386448085,
"learning_rate": 3.613880143062539e-05,
"loss": 0.5274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3472147583961487,
"step": 1115,
"valid_targets_mean": 4914.9,
"valid_targets_min": 2074
},
{
"epoch": 1.9796640141467727,
"grad_norm": 0.5806190920195576,
"learning_rate": 3.6086596430048355e-05,
"loss": 0.544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17797411978244781,
"step": 1120,
"valid_targets_mean": 2610.4,
"valid_targets_min": 1172
},
{
"epoch": 1.9885057471264367,
"grad_norm": 0.79939207014776,
"learning_rate": 3.603407912072303e-05,
"loss": 0.4664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3026364743709564,
"step": 1125,
"valid_targets_mean": 2167.8,
"valid_targets_min": 606
},
{
"epoch": 1.9973474801061006,
"grad_norm": 0.6158400263989293,
"learning_rate": 3.598125052223209e-05,
"loss": 0.4927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2575317621231079,
"step": 1130,
"valid_targets_mean": 3856.8,
"valid_targets_min": 266
},
{
"epoch": 2.0053050397877983,
"grad_norm": 0.6506509574828292,
"learning_rate": 3.592811166020166e-05,
"loss": 0.461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2540547847747803,
"step": 1135,
"valid_targets_mean": 3808.8,
"valid_targets_min": 433
},
{
"epoch": 2.0141467727674622,
"grad_norm": 0.7334124808950342,
"learning_rate": 3.5874663566281386e-05,
"loss": 0.4984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2256934642791748,
"step": 1140,
"valid_targets_mean": 2785.5,
"valid_targets_min": 435
},
{
"epoch": 2.0229885057471266,
"grad_norm": 0.5825400538253857,
"learning_rate": 3.582090727812441e-05,
"loss": 0.4376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22117963433265686,
"step": 1145,
"valid_targets_mean": 5034.1,
"valid_targets_min": 1744
},
{
"epoch": 2.0318302387267906,
"grad_norm": 0.7871465022788394,
"learning_rate": 3.576684383936721e-05,
"loss": 0.4825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28266459703445435,
"step": 1150,
"valid_targets_mean": 2724.8,
"valid_targets_min": 933
},
{
"epoch": 2.0406719717064545,
"grad_norm": 0.6415857615517944,
"learning_rate": 3.571247429960939e-05,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30939337611198425,
"step": 1155,
"valid_targets_mean": 4437.4,
"valid_targets_min": 535
},
{
"epoch": 2.0495137046861185,
"grad_norm": 0.6177273757478585,
"learning_rate": 3.5657799714393226e-05,
"loss": 0.4842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17025458812713623,
"step": 1160,
"valid_targets_mean": 3223.8,
"valid_targets_min": 1553
},
{
"epoch": 2.0583554376657824,
"grad_norm": 0.833706903246219,
"learning_rate": 3.560282114518324e-05,
"loss": 0.4675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26239508390426636,
"step": 1165,
"valid_targets_mean": 2714.1,
"valid_targets_min": 1097
},
{
"epoch": 2.0671971706454464,
"grad_norm": 0.7225359837532538,
"learning_rate": 3.554753965934556e-05,
"loss": 0.4865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35689157247543335,
"step": 1170,
"valid_targets_mean": 4220.5,
"valid_targets_min": 1543
},
{
"epoch": 2.0760389036251103,
"grad_norm": 0.7784056460093122,
"learning_rate": 3.5491956330127206e-05,
"loss": 0.5007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3038363456726074,
"step": 1175,
"valid_targets_mean": 3015.6,
"valid_targets_min": 295
},
{
"epoch": 2.0848806366047747,
"grad_norm": 0.6565097352886429,
"learning_rate": 3.543607223663524e-05,
"loss": 0.4824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24286240339279175,
"step": 1180,
"valid_targets_mean": 3437.2,
"valid_targets_min": 576
},
{
"epoch": 2.0937223695844387,
"grad_norm": 0.6492970939073816,
"learning_rate": 3.537988846381585e-05,
"loss": 0.4959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.303530752658844,
"step": 1185,
"valid_targets_mean": 4899.6,
"valid_targets_min": 1488
},
{
"epoch": 2.1025641025641026,
"grad_norm": 0.7925259880545755,
"learning_rate": 3.532340610243325e-05,
"loss": 0.5028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27291086316108704,
"step": 1190,
"valid_targets_mean": 3204.2,
"valid_targets_min": 880
},
{
"epoch": 2.1114058355437666,
"grad_norm": 0.6589724671449128,
"learning_rate": 3.526662624904852e-05,
"loss": 0.4576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2381266951560974,
"step": 1195,
"valid_targets_mean": 3589.5,
"valid_targets_min": 913
},
{
"epoch": 2.1202475685234305,
"grad_norm": 0.7528452910033151,
"learning_rate": 3.5209550005998314e-05,
"loss": 0.4621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2670268714427948,
"step": 1200,
"valid_targets_mean": 3119.5,
"valid_targets_min": 531
},
{
"epoch": 2.1290893015030945,
"grad_norm": 0.5446738881024474,
"learning_rate": 3.515217848137347e-05,
"loss": 0.5064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26400917768478394,
"step": 1205,
"valid_targets_mean": 5657.0,
"valid_targets_min": 2360
},
{
"epoch": 2.1379310344827585,
"grad_norm": 0.8894408640488581,
"learning_rate": 3.509451278899748e-05,
"loss": 0.4645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17728659510612488,
"step": 1210,
"valid_targets_mean": 2654.2,
"valid_targets_min": 278
},
{
"epoch": 2.146772767462423,
"grad_norm": 0.7198826676958434,
"learning_rate": 3.503655404840488e-05,
"loss": 0.4721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26327475905418396,
"step": 1215,
"valid_targets_mean": 3134.6,
"valid_targets_min": 283
},
{
"epoch": 2.155614500442087,
"grad_norm": 0.8407871800228818,
"learning_rate": 3.497830338481949e-05,
"loss": 0.4882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.295600950717926,
"step": 1220,
"valid_targets_mean": 2603.4,
"valid_targets_min": 547
},
{
"epoch": 2.1644562334217508,
"grad_norm": 0.6328345124649135,
"learning_rate": 3.491976192913262e-05,
"loss": 0.4497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22263498604297638,
"step": 1225,
"valid_targets_mean": 3946.1,
"valid_targets_min": 447
},
{
"epoch": 2.1732979664014147,
"grad_norm": 0.7203331611468773,
"learning_rate": 3.486093081788106e-05,
"loss": 0.4413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2181500494480133,
"step": 1230,
"valid_targets_mean": 2403.6,
"valid_targets_min": 257
},
{
"epoch": 2.1821396993810787,
"grad_norm": 1.2624507413601598,
"learning_rate": 3.480181119322504e-05,
"loss": 0.5526,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21810586750507355,
"step": 1235,
"valid_targets_mean": 3192.0,
"valid_targets_min": 574
},
{
"epoch": 2.1909814323607426,
"grad_norm": 0.6145928910538749,
"learning_rate": 3.474240420292606e-05,
"loss": 0.4818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26425665616989136,
"step": 1240,
"valid_targets_mean": 4262.5,
"valid_targets_min": 2190
},
{
"epoch": 2.1998231653404066,
"grad_norm": 0.7136638714717287,
"learning_rate": 3.4682711000324586e-05,
"loss": 0.4567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22414344549179077,
"step": 1245,
"valid_targets_mean": 3129.0,
"valid_targets_min": 956
},
{
"epoch": 2.2086648983200705,
"grad_norm": 0.6530586834174523,
"learning_rate": 3.462273274431769e-05,
"loss": 0.4573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2845330536365509,
"step": 1250,
"valid_targets_mean": 3753.6,
"valid_targets_min": 354
},
{
"epoch": 2.217506631299735,
"grad_norm": 0.6049021187332466,
"learning_rate": 3.456247059933653e-05,
"loss": 0.4824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23369532823562622,
"step": 1255,
"valid_targets_mean": 3603.4,
"valid_targets_min": 247
},
{
"epoch": 2.226348364279399,
"grad_norm": 0.7452682692760721,
"learning_rate": 3.450192573532373e-05,
"loss": 0.5275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37186628580093384,
"step": 1260,
"valid_targets_mean": 3171.0,
"valid_targets_min": 718
},
{
"epoch": 2.235190097259063,
"grad_norm": 0.6365702923616391,
"learning_rate": 3.444109932771072e-05,
"loss": 0.4654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.261175274848938,
"step": 1265,
"valid_targets_mean": 4370.4,
"valid_targets_min": 1426
},
{
"epoch": 2.2440318302387268,
"grad_norm": 0.5681744054075202,
"learning_rate": 3.4379992557394846e-05,
"loss": 0.5126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20251402258872986,
"step": 1270,
"valid_targets_mean": 4562.1,
"valid_targets_min": 1713
},
{
"epoch": 2.2528735632183907,
"grad_norm": 0.7410762502762586,
"learning_rate": 3.4318606610716484e-05,
"loss": 0.5167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20561201870441437,
"step": 1275,
"valid_targets_mean": 2180.5,
"valid_targets_min": 1254
},
{
"epoch": 2.2617152961980547,
"grad_norm": 0.5452558320658369,
"learning_rate": 3.4256942679436015e-05,
"loss": 0.4922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19533419609069824,
"step": 1280,
"valid_targets_mean": 3569.5,
"valid_targets_min": 1534
},
{
"epoch": 2.270557029177719,
"grad_norm": 0.7468519348908569,
"learning_rate": 3.419500196071067e-05,
"loss": 0.4754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2667611241340637,
"step": 1285,
"valid_targets_mean": 2884.8,
"valid_targets_min": 641
},
{
"epoch": 2.279398762157383,
"grad_norm": 0.6333342302390959,
"learning_rate": 3.413278565707128e-05,
"loss": 0.4993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15673427283763885,
"step": 1290,
"valid_targets_mean": 2277.5,
"valid_targets_min": 340
},
{
"epoch": 2.288240495137047,
"grad_norm": 0.6520958194331384,
"learning_rate": 3.407029497639896e-05,
"loss": 0.4577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2410448044538498,
"step": 1295,
"valid_targets_mean": 3485.1,
"valid_targets_min": 844
},
{
"epoch": 2.297082228116711,
"grad_norm": 0.7282805052878496,
"learning_rate": 3.400753113190164e-05,
"loss": 0.5239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.356065034866333,
"step": 1300,
"valid_targets_mean": 2978.1,
"valid_targets_min": 327
},
{
"epoch": 2.305923961096375,
"grad_norm": 0.7494491120423273,
"learning_rate": 3.394449534209049e-05,
"loss": 0.475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2870040535926819,
"step": 1305,
"valid_targets_mean": 3106.1,
"valid_targets_min": 646
},
{
"epoch": 2.314765694076039,
"grad_norm": 0.7866263743420345,
"learning_rate": 3.388118883075632e-05,
"loss": 0.4645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3140355348587036,
"step": 1310,
"valid_targets_mean": 2766.9,
"valid_targets_min": 1396
},
{
"epoch": 2.323607427055703,
"grad_norm": 0.6490756330304519,
"learning_rate": 3.381761282694576e-05,
"loss": 0.4587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1746228039264679,
"step": 1315,
"valid_targets_mean": 1878.6,
"valid_targets_min": 366
},
{
"epoch": 2.3324491600353667,
"grad_norm": 0.5903200212592301,
"learning_rate": 3.375376856493744e-05,
"loss": 0.474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2511587142944336,
"step": 1320,
"valid_targets_mean": 4894.8,
"valid_targets_min": 641
},
{
"epoch": 2.341290893015031,
"grad_norm": 2.254093889370584,
"learning_rate": 3.368965728421802e-05,
"loss": 0.4457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.161946639418602,
"step": 1325,
"valid_targets_mean": 2834.8,
"valid_targets_min": 392
},
{
"epoch": 2.350132625994695,
"grad_norm": 0.9142370689095928,
"learning_rate": 3.362528022945811e-05,
"loss": 0.4635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2488413155078888,
"step": 1330,
"valid_targets_mean": 1759.2,
"valid_targets_min": 432
},
{
"epoch": 2.358974358974359,
"grad_norm": 0.6231014207273252,
"learning_rate": 3.3560638650488116e-05,
"loss": 0.481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24347589910030365,
"step": 1335,
"valid_targets_mean": 3643.8,
"valid_targets_min": 1798
},
{
"epoch": 2.367816091954023,
"grad_norm": 0.7798321013057438,
"learning_rate": 3.3495733802273973e-05,
"loss": 0.4947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27684855461120605,
"step": 1340,
"valid_targets_mean": 2807.4,
"valid_targets_min": 671
},
{
"epoch": 2.376657824933687,
"grad_norm": 0.6835229910495109,
"learning_rate": 3.3430566944892797e-05,
"loss": 0.4769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20981459319591522,
"step": 1345,
"valid_targets_mean": 2786.4,
"valid_targets_min": 697
},
{
"epoch": 2.385499557913351,
"grad_norm": 0.7027687967506704,
"learning_rate": 3.3365139343508394e-05,
"loss": 0.5036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24709592759609222,
"step": 1350,
"valid_targets_mean": 2751.4,
"valid_targets_min": 429
},
{
"epoch": 2.394341290893015,
"grad_norm": 0.6262006292592385,
"learning_rate": 3.329945226834672e-05,
"loss": 0.4645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18077601492404938,
"step": 1355,
"valid_targets_mean": 2843.1,
"valid_targets_min": 994
},
{
"epoch": 2.4031830238726792,
"grad_norm": 0.6277485840526359,
"learning_rate": 3.3233506994671226e-05,
"loss": 0.4951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2642451524734497,
"step": 1360,
"valid_targets_mean": 3429.4,
"valid_targets_min": 446
},
{
"epoch": 2.412024756852343,
"grad_norm": 0.6280596559682324,
"learning_rate": 3.316730480275804e-05,
"loss": 0.4464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22805391252040863,
"step": 1365,
"valid_targets_mean": 3516.9,
"valid_targets_min": 1427
},
{
"epoch": 2.420866489832007,
"grad_norm": 0.6174264929077061,
"learning_rate": 3.3100846977871205e-05,
"loss": 0.4913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2780839502811432,
"step": 1370,
"valid_targets_mean": 4372.0,
"valid_targets_min": 595
},
{
"epoch": 2.429708222811671,
"grad_norm": 0.656729892977582,
"learning_rate": 3.303413481023767e-05,
"loss": 0.4994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19668014347553253,
"step": 1375,
"valid_targets_mean": 2811.8,
"valid_targets_min": 482
},
{
"epoch": 2.438549955791335,
"grad_norm": 0.7226257651578697,
"learning_rate": 3.296716959502222e-05,
"loss": 0.4784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22153441607952118,
"step": 1380,
"valid_targets_mean": 2547.9,
"valid_targets_min": 650
},
{
"epoch": 2.447391688770999,
"grad_norm": 0.7651983874835208,
"learning_rate": 3.2899952632302406e-05,
"loss": 0.4922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2565222978591919,
"step": 1385,
"valid_targets_mean": 2316.4,
"valid_targets_min": 389
},
{
"epoch": 2.456233421750663,
"grad_norm": 0.629453575504003,
"learning_rate": 3.2832485227043224e-05,
"loss": 0.4593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19831818342208862,
"step": 1390,
"valid_targets_mean": 3157.9,
"valid_targets_min": 1057
},
{
"epoch": 2.465075154730327,
"grad_norm": 0.6047254462995167,
"learning_rate": 3.276476868907185e-05,
"loss": 0.4621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29224517941474915,
"step": 1395,
"valid_targets_mean": 4613.8,
"valid_targets_min": 1331
},
{
"epoch": 2.4739168877099913,
"grad_norm": 0.7333279372759346,
"learning_rate": 3.2696804333052134e-05,
"loss": 0.497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1974330097436905,
"step": 1400,
"valid_targets_mean": 2125.1,
"valid_targets_min": 329
},
{
"epoch": 2.4827586206896552,
"grad_norm": 0.7776273687671615,
"learning_rate": 3.2628593478459166e-05,
"loss": 0.5055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2529323399066925,
"step": 1405,
"valid_targets_mean": 2489.1,
"valid_targets_min": 724
},
{
"epoch": 2.491600353669319,
"grad_norm": 0.7273539498207023,
"learning_rate": 3.256013744955359e-05,
"loss": 0.4718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30455833673477173,
"step": 1410,
"valid_targets_mean": 3809.0,
"valid_targets_min": 1703
},
{
"epoch": 2.500442086648983,
"grad_norm": 0.564269031629325,
"learning_rate": 3.249143757535593e-05,
"loss": 0.4583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21314361691474915,
"step": 1415,
"valid_targets_mean": 3426.6,
"valid_targets_min": 1214
},
{
"epoch": 2.509283819628647,
"grad_norm": 0.5557251931105729,
"learning_rate": 3.242249518962075e-05,
"loss": 0.4994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18279360234737396,
"step": 1420,
"valid_targets_mean": 3213.4,
"valid_targets_min": 1033
},
{
"epoch": 2.5181255526083115,
"grad_norm": 0.550481771742281,
"learning_rate": 3.2353311630810824e-05,
"loss": 0.4564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30488190054893494,
"step": 1425,
"valid_targets_mean": 5551.5,
"valid_targets_min": 1786
},
{
"epoch": 2.5269672855879755,
"grad_norm": 0.7806815136684526,
"learning_rate": 3.2283888242071084e-05,
"loss": 0.4889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23620276153087616,
"step": 1430,
"valid_targets_mean": 2326.1,
"valid_targets_min": 260
},
{
"epoch": 2.5358090185676394,
"grad_norm": 0.6636248793061827,
"learning_rate": 3.221422637120259e-05,
"loss": 0.4679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1364372968673706,
"step": 1435,
"valid_targets_mean": 1784.4,
"valid_targets_min": 384
},
{
"epoch": 2.5446507515473034,
"grad_norm": 0.689385789889328,
"learning_rate": 3.2144327370636346e-05,
"loss": 0.454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20073749125003815,
"step": 1440,
"valid_targets_mean": 3205.1,
"valid_targets_min": 381
},
{
"epoch": 2.5534924845269673,
"grad_norm": 0.6328008971941544,
"learning_rate": 3.2074192597407035e-05,
"loss": 0.4613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3022666573524475,
"step": 1445,
"valid_targets_mean": 4333.4,
"valid_targets_min": 1507
},
{
"epoch": 2.5623342175066313,
"grad_norm": 0.59131850878343,
"learning_rate": 3.200382341312669e-05,
"loss": 0.4492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17799311876296997,
"step": 1450,
"valid_targets_mean": 3369.5,
"valid_targets_min": 1668
},
{
"epoch": 2.571175950486295,
"grad_norm": 0.7805466539055157,
"learning_rate": 3.193322118395825e-05,
"loss": 0.4892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27352964878082275,
"step": 1455,
"valid_targets_mean": 2186.5,
"valid_targets_min": 560
},
{
"epoch": 2.580017683465959,
"grad_norm": 0.6876454265526983,
"learning_rate": 3.1862387280589035e-05,
"loss": 0.4779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3268851041793823,
"step": 1460,
"valid_targets_mean": 3722.8,
"valid_targets_min": 1455
},
{
"epoch": 2.588859416445623,
"grad_norm": 0.6736850428355156,
"learning_rate": 3.179132307820415e-05,
"loss": 0.4415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23798906803131104,
"step": 1465,
"valid_targets_mean": 2838.0,
"valid_targets_min": 682
},
{
"epoch": 2.5977011494252875,
"grad_norm": 0.596929830688196,
"learning_rate": 3.1720029956459765e-05,
"loss": 0.4591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2674519419670105,
"step": 1470,
"valid_targets_mean": 4175.8,
"valid_targets_min": 1486
},
{
"epoch": 2.6065428824049515,
"grad_norm": 0.5748031569774971,
"learning_rate": 3.1648509299456354e-05,
"loss": 0.4262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2019733488559723,
"step": 1475,
"valid_targets_mean": 3431.9,
"valid_targets_min": 417
},
{
"epoch": 2.6153846153846154,
"grad_norm": 0.6572317898083503,
"learning_rate": 3.15767624957118e-05,
"loss": 0.5071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3238973915576935,
"step": 1480,
"valid_targets_mean": 4004.2,
"valid_targets_min": 1921
},
{
"epoch": 2.6242263483642794,
"grad_norm": 0.6374727405441111,
"learning_rate": 3.150479093813444e-05,
"loss": 0.4698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257358580827713,
"step": 1485,
"valid_targets_mean": 3410.9,
"valid_targets_min": 1841
},
{
"epoch": 2.6330680813439433,
"grad_norm": 0.7370301376235759,
"learning_rate": 3.143259602399605e-05,
"loss": 0.4813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24704976379871368,
"step": 1490,
"valid_targets_mean": 2845.5,
"valid_targets_min": 494
},
{
"epoch": 2.6419098143236073,
"grad_norm": 0.6458521957650634,
"learning_rate": 3.13601791549047e-05,
"loss": 0.4572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21648521721363068,
"step": 1495,
"valid_targets_mean": 2931.2,
"valid_targets_min": 1190
},
{
"epoch": 2.6507515473032717,
"grad_norm": 0.6857098017912163,
"learning_rate": 3.128754173677753e-05,
"loss": 0.4732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17468172311782837,
"step": 1500,
"valid_targets_mean": 2179.5,
"valid_targets_min": 428
},
{
"epoch": 2.6595932802829356,
"grad_norm": 0.7760295420887048,
"learning_rate": 3.121468517981348e-05,
"loss": 0.4793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2126651257276535,
"step": 1505,
"valid_targets_mean": 2069.2,
"valid_targets_min": 643
},
{
"epoch": 2.6684350132625996,
"grad_norm": 0.7256165385608961,
"learning_rate": 3.1141610898465886e-05,
"loss": 0.4586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24016624689102173,
"step": 1510,
"valid_targets_mean": 2405.6,
"valid_targets_min": 769
},
{
"epoch": 2.6772767462422635,
"grad_norm": 0.8041492470671632,
"learning_rate": 3.106832031141505e-05,
"loss": 0.4882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2537711560726166,
"step": 1515,
"valid_targets_mean": 2232.1,
"valid_targets_min": 538
},
{
"epoch": 2.6861184792219275,
"grad_norm": 0.6768740030703516,
"learning_rate": 3.099481484154066e-05,
"loss": 0.4694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2770196199417114,
"step": 1520,
"valid_targets_mean": 3394.1,
"valid_targets_min": 951
},
{
"epoch": 2.6949602122015914,
"grad_norm": 0.7614885023952586,
"learning_rate": 3.092109591589421e-05,
"loss": 0.47,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24348753690719604,
"step": 1525,
"valid_targets_mean": 1985.0,
"valid_targets_min": 661
},
{
"epoch": 2.7038019451812554,
"grad_norm": 0.6973530090116009,
"learning_rate": 3.084716496567125e-05,
"loss": 0.4691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2216261327266693,
"step": 1530,
"valid_targets_mean": 2607.2,
"valid_targets_min": 927
},
{
"epoch": 2.7126436781609193,
"grad_norm": 0.6643269820883152,
"learning_rate": 3.0773023426183646e-05,
"loss": 0.5029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21378345787525177,
"step": 1535,
"valid_targets_mean": 2372.9,
"valid_targets_min": 298
},
{
"epoch": 2.7214854111405833,
"grad_norm": 0.6302383408350807,
"learning_rate": 3.069867273683166e-05,
"loss": 0.4813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18604375422000885,
"step": 1540,
"valid_targets_mean": 2405.8,
"valid_targets_min": 708
},
{
"epoch": 2.7303271441202477,
"grad_norm": 0.7402043292567106,
"learning_rate": 3.062411434107607e-05,
"loss": 0.4961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27701494097709656,
"step": 1545,
"valid_targets_mean": 3043.9,
"valid_targets_min": 1120
},
{
"epoch": 2.7391688770999116,
"grad_norm": 0.7333854416465081,
"learning_rate": 3.0549349686410086e-05,
"loss": 0.4807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1735975593328476,
"step": 1550,
"valid_targets_mean": 1787.8,
"valid_targets_min": 1101
},
{
"epoch": 2.7480106100795756,
"grad_norm": 0.5787318917413554,
"learning_rate": 3.0474380224331292e-05,
"loss": 0.4601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26284363865852356,
"step": 1555,
"valid_targets_mean": 3658.6,
"valid_targets_min": 1467
},
{
"epoch": 2.7568523430592395,
"grad_norm": 0.5153363716994127,
"learning_rate": 3.039920741031342e-05,
"loss": 0.452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1932397484779358,
"step": 1560,
"valid_targets_mean": 3985.8,
"valid_targets_min": 2070
},
{
"epoch": 2.7656940760389035,
"grad_norm": 0.7429137625185662,
"learning_rate": 3.0323832703778168e-05,
"loss": 0.477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2431662678718567,
"step": 1565,
"valid_targets_mean": 2817.0,
"valid_targets_min": 1312
},
{
"epoch": 2.774535809018568,
"grad_norm": 0.6481250155554005,
"learning_rate": 3.024825756806677e-05,
"loss": 0.4784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3212037980556488,
"step": 1570,
"valid_targets_mean": 3536.4,
"valid_targets_min": 307
},
{
"epoch": 2.783377541998232,
"grad_norm": 0.5946835818022652,
"learning_rate": 3.017248347041168e-05,
"loss": 0.4674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17257541418075562,
"step": 1575,
"valid_targets_mean": 3216.1,
"valid_targets_min": 338
},
{
"epoch": 2.792219274977896,
"grad_norm": 0.7079495479617642,
"learning_rate": 3.0096511881908007e-05,
"loss": 0.476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25472956895828247,
"step": 1580,
"valid_targets_mean": 2929.1,
"valid_targets_min": 920
},
{
"epoch": 2.8010610079575597,
"grad_norm": 0.6686876235075944,
"learning_rate": 3.0020344277485017e-05,
"loss": 0.48,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24332070350646973,
"step": 1585,
"valid_targets_mean": 3509.1,
"valid_targets_min": 1355
},
{
"epoch": 2.8099027409372237,
"grad_norm": 0.5961265521760359,
"learning_rate": 2.994398213587746e-05,
"loss": 0.4652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16399900615215302,
"step": 1590,
"valid_targets_mean": 2690.2,
"valid_targets_min": 998
},
{
"epoch": 2.8187444739168876,
"grad_norm": 0.6932732714841346,
"learning_rate": 2.9867426939596876e-05,
"loss": 0.4838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23998896777629852,
"step": 1595,
"valid_targets_mean": 2742.6,
"valid_targets_min": 462
},
{
"epoch": 2.8275862068965516,
"grad_norm": 0.6373428022728593,
"learning_rate": 2.9790680174902818e-05,
"loss": 0.4958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28616029024124146,
"step": 1600,
"valid_targets_mean": 3503.4,
"valid_targets_min": 1984
},
{
"epoch": 2.8364279398762156,
"grad_norm": 0.5701727639748247,
"learning_rate": 2.971374333177398e-05,
"loss": 0.4531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2033827304840088,
"step": 1605,
"valid_targets_mean": 3583.5,
"valid_targets_min": 371
},
{
"epoch": 2.8452696728558795,
"grad_norm": 0.6938709515640729,
"learning_rate": 2.963661790387928e-05,
"loss": 0.4687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16415715217590332,
"step": 1610,
"valid_targets_mean": 1516.6,
"valid_targets_min": 348
},
{
"epoch": 2.854111405835544,
"grad_norm": 0.6819822107535831,
"learning_rate": 2.9559305388548884e-05,
"loss": 0.4605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30489426851272583,
"step": 1615,
"valid_targets_mean": 3739.5,
"valid_targets_min": 1669
},
{
"epoch": 2.862953138815208,
"grad_norm": 0.6256616922874445,
"learning_rate": 2.948180728674508e-05,
"loss": 0.4769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2562219798564911,
"step": 1620,
"valid_targets_mean": 3812.9,
"valid_targets_min": 446
},
{
"epoch": 2.871794871794872,
"grad_norm": 0.6400236041741094,
"learning_rate": 2.9404125103033207e-05,
"loss": 0.4986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29524898529052734,
"step": 1625,
"valid_targets_mean": 4371.4,
"valid_targets_min": 1584
},
{
"epoch": 2.8806366047745358,
"grad_norm": 0.6341608498880749,
"learning_rate": 2.9326260345552384e-05,
"loss": 0.4532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2372559905052185,
"step": 1630,
"valid_targets_mean": 3315.1,
"valid_targets_min": 807
},
{
"epoch": 2.8894783377541997,
"grad_norm": 0.6276072795012839,
"learning_rate": 2.924821452598628e-05,
"loss": 0.4596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32003140449523926,
"step": 1635,
"valid_targets_mean": 4198.9,
"valid_targets_min": 294
},
{
"epoch": 2.898320070733864,
"grad_norm": 0.7616482436393485,
"learning_rate": 2.916998915953373e-05,
"loss": 0.4898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20601674914360046,
"step": 1640,
"valid_targets_mean": 2052.5,
"valid_targets_min": 778
},
{
"epoch": 2.907161803713528,
"grad_norm": 0.5882065240627146,
"learning_rate": 2.9091585764879334e-05,
"loss": 0.4942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24223053455352783,
"step": 1645,
"valid_targets_mean": 4031.1,
"valid_targets_min": 378
},
{
"epoch": 2.916003536693192,
"grad_norm": 0.6054495841065836,
"learning_rate": 2.9013005864163967e-05,
"loss": 0.4683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18661022186279297,
"step": 1650,
"valid_targets_mean": 3359.5,
"valid_targets_min": 1665
},
{
"epoch": 2.924845269672856,
"grad_norm": 0.6838185112738919,
"learning_rate": 2.8934250982955245e-05,
"loss": 0.5104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21030931174755096,
"step": 1655,
"valid_targets_mean": 2463.9,
"valid_targets_min": 367
},
{
"epoch": 2.93368700265252,
"grad_norm": 0.5869513062851025,
"learning_rate": 2.8855322650217878e-05,
"loss": 0.4734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2261839509010315,
"step": 1660,
"valid_targets_mean": 4131.2,
"valid_targets_min": 1915
},
{
"epoch": 2.942528735632184,
"grad_norm": 0.6635908796868752,
"learning_rate": 2.877622239828402e-05,
"loss": 0.4742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3128895163536072,
"step": 1665,
"valid_targets_mean": 3485.6,
"valid_targets_min": 1311
},
{
"epoch": 2.951370468611848,
"grad_norm": 0.5866931808918497,
"learning_rate": 2.8696951762823482e-05,
"loss": 0.4536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27576667070388794,
"step": 1670,
"valid_targets_mean": 5840.1,
"valid_targets_min": 867
},
{
"epoch": 2.9602122015915118,
"grad_norm": 0.7047207677935268,
"learning_rate": 2.8617512282813962e-05,
"loss": 0.4773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672806978225708,
"step": 1675,
"valid_targets_mean": 3142.0,
"valid_targets_min": 411
},
{
"epoch": 2.9690539345711757,
"grad_norm": 0.6805728312782533,
"learning_rate": 2.8537905500511115e-05,
"loss": 0.4409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22739487886428833,
"step": 1680,
"valid_targets_mean": 2617.9,
"valid_targets_min": 488
},
{
"epoch": 2.97789566755084,
"grad_norm": 0.6399928488222026,
"learning_rate": 2.845813296141867e-05,
"loss": 0.4841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33402326703071594,
"step": 1685,
"valid_targets_mean": 3724.4,
"valid_targets_min": 283
},
{
"epoch": 2.986737400530504,
"grad_norm": 0.657324357265603,
"learning_rate": 2.8378196214258368e-05,
"loss": 0.4642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23617523908615112,
"step": 1690,
"valid_targets_mean": 3832.5,
"valid_targets_min": 442
},
{
"epoch": 2.995579133510168,
"grad_norm": 0.7665365085077115,
"learning_rate": 2.8298096810939947e-05,
"loss": 0.4763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22332416474819183,
"step": 1695,
"valid_targets_mean": 2495.6,
"valid_targets_min": 1444
},
{
"epoch": 3.0035366931918657,
"grad_norm": 0.6631145203555193,
"learning_rate": 2.821783630653097e-05,
"loss": 0.4496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41785138845443726,
"step": 1700,
"valid_targets_mean": 4816.5,
"valid_targets_min": 2915
},
{
"epoch": 3.0123784261715296,
"grad_norm": 0.6337435624348,
"learning_rate": 2.8137416259226647e-05,
"loss": 0.4547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2246091365814209,
"step": 1705,
"valid_targets_mean": 3841.2,
"valid_targets_min": 1235
},
{
"epoch": 3.0212201591511936,
"grad_norm": 0.6936797200273987,
"learning_rate": 2.805683823031962e-05,
"loss": 0.4457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1735125035047531,
"step": 1710,
"valid_targets_mean": 2731.0,
"valid_targets_min": 714
},
{
"epoch": 3.0300618921308575,
"grad_norm": 0.7891995315990228,
"learning_rate": 2.797610378416958e-05,
"loss": 0.4231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16492772102355957,
"step": 1715,
"valid_targets_mean": 2113.0,
"valid_targets_min": 578
},
{
"epoch": 3.0389036251105215,
"grad_norm": 0.7386808391583857,
"learning_rate": 2.789521448817297e-05,
"loss": 0.4209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26257234811782837,
"step": 1720,
"valid_targets_mean": 3744.8,
"valid_targets_min": 1677
},
{
"epoch": 3.047745358090186,
"grad_norm": 0.8448422789924801,
"learning_rate": 2.7814171912732505e-05,
"loss": 0.4595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2198343276977539,
"step": 1725,
"valid_targets_mean": 2466.9,
"valid_targets_min": 579
},
{
"epoch": 3.05658709106985,
"grad_norm": 0.5394050393186041,
"learning_rate": 2.7732977631226707e-05,
"loss": 0.4599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1662464141845703,
"step": 1730,
"valid_targets_mean": 3657.5,
"valid_targets_min": 418
},
{
"epoch": 3.065428824049514,
"grad_norm": 0.7249259150149697,
"learning_rate": 2.7651633219979354e-05,
"loss": 0.4421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2690415382385254,
"step": 1735,
"valid_targets_mean": 3475.8,
"valid_targets_min": 1327
},
{
"epoch": 3.0742705570291777,
"grad_norm": 0.5613143824306901,
"learning_rate": 2.757014025822887e-05,
"loss": 0.4157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1862303614616394,
"step": 1740,
"valid_targets_mean": 5056.2,
"valid_targets_min": 562
},
{
"epoch": 3.0831122900088417,
"grad_norm": 0.6722692705575857,
"learning_rate": 2.7488500328097676e-05,
"loss": 0.4646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23648124933242798,
"step": 1745,
"valid_targets_mean": 2867.6,
"valid_targets_min": 595
},
{
"epoch": 3.0919540229885056,
"grad_norm": 0.6814783628326924,
"learning_rate": 2.740671501456147e-05,
"loss": 0.4398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12536823749542236,
"step": 1750,
"valid_targets_mean": 1615.6,
"valid_targets_min": 327
},
{
"epoch": 3.1007957559681696,
"grad_norm": 0.6898698530287688,
"learning_rate": 2.732478590541846e-05,
"loss": 0.4825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14612561464309692,
"step": 1755,
"valid_targets_mean": 2145.4,
"valid_targets_min": 409
},
{
"epoch": 3.109637488947834,
"grad_norm": 0.7057545284878672,
"learning_rate": 2.7242714591258515e-05,
"loss": 0.4489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2028021216392517,
"step": 1760,
"valid_targets_mean": 2730.9,
"valid_targets_min": 821
},
{
"epoch": 3.118479221927498,
"grad_norm": 0.7145345954957985,
"learning_rate": 2.716050266543233e-05,
"loss": 0.447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2143976241350174,
"step": 1765,
"valid_targets_mean": 2795.2,
"valid_targets_min": 354
},
{
"epoch": 3.127320954907162,
"grad_norm": 0.6387454256981671,
"learning_rate": 2.707815172402045e-05,
"loss": 0.4511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2258991003036499,
"step": 1770,
"valid_targets_mean": 4250.8,
"valid_targets_min": 292
},
{
"epoch": 3.136162687886826,
"grad_norm": 0.6217741057104463,
"learning_rate": 2.6995663365802297e-05,
"loss": 0.4653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2483760118484497,
"step": 1775,
"valid_targets_mean": 4210.9,
"valid_targets_min": 283
},
{
"epoch": 3.14500442086649,
"grad_norm": 0.6457517067956914,
"learning_rate": 2.6913039192225143e-05,
"loss": 0.4716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32969963550567627,
"step": 1780,
"valid_targets_mean": 4354.4,
"valid_targets_min": 756
},
{
"epoch": 3.1538461538461537,
"grad_norm": 0.6429893214891368,
"learning_rate": 2.683028080737301e-05,
"loss": 0.4321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21806424856185913,
"step": 1785,
"valid_targets_mean": 3157.8,
"valid_targets_min": 532
},
{
"epoch": 3.1626878868258177,
"grad_norm": 0.692439432500108,
"learning_rate": 2.6747389817935513e-05,
"loss": 0.4697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31872475147247314,
"step": 1790,
"valid_targets_mean": 3962.4,
"valid_targets_min": 956
},
{
"epoch": 3.171529619805482,
"grad_norm": 0.655636164934992,
"learning_rate": 2.6664367833176706e-05,
"loss": 0.4435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24065600335597992,
"step": 1795,
"valid_targets_mean": 4039.6,
"valid_targets_min": 767
},
{
"epoch": 3.180371352785146,
"grad_norm": 0.6356274580947101,
"learning_rate": 2.6581216464903783e-05,
"loss": 0.447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21401917934417725,
"step": 1800,
"valid_targets_mean": 3759.8,
"valid_targets_min": 778
},
{
"epoch": 3.18921308576481,
"grad_norm": 0.6755187398673654,
"learning_rate": 2.649793732743585e-05,
"loss": 0.4587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2595488727092743,
"step": 1805,
"valid_targets_mean": 4247.6,
"valid_targets_min": 583
},
{
"epoch": 3.198054818744474,
"grad_norm": 0.6601036816629008,
"learning_rate": 2.641453203757253e-05,
"loss": 0.4575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24937765300273895,
"step": 1810,
"valid_targets_mean": 5081.9,
"valid_targets_min": 1584
},
{
"epoch": 3.206896551724138,
"grad_norm": 0.7345675030768746,
"learning_rate": 2.6331002214562612e-05,
"loss": 0.4535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2856788635253906,
"step": 1815,
"valid_targets_mean": 3258.6,
"valid_targets_min": 418
},
{
"epoch": 3.215738284703802,
"grad_norm": 0.6443854997962501,
"learning_rate": 2.624734948007259e-05,
"loss": 0.4782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19514860212802887,
"step": 1820,
"valid_targets_mean": 2690.8,
"valid_targets_min": 1080
},
{
"epoch": 3.224580017683466,
"grad_norm": 0.6505251815752711,
"learning_rate": 2.616357545815518e-05,
"loss": 0.4341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18154998123645782,
"step": 1825,
"valid_targets_mean": 2853.5,
"valid_targets_min": 1039
},
{
"epoch": 3.2334217506631298,
"grad_norm": 0.639089706648105,
"learning_rate": 2.6079681775217833e-05,
"loss": 0.4494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1521425098180771,
"step": 1830,
"valid_targets_mean": 2546.0,
"valid_targets_min": 1092
},
{
"epoch": 3.242263483642794,
"grad_norm": 0.8346126474494834,
"learning_rate": 2.5995670059991085e-05,
"loss": 0.4564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20812271535396576,
"step": 1835,
"valid_targets_mean": 2109.9,
"valid_targets_min": 475
},
{
"epoch": 3.251105216622458,
"grad_norm": 0.6974668474879332,
"learning_rate": 2.5911541943497e-05,
"loss": 0.4148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21064886450767517,
"step": 1840,
"valid_targets_mean": 3080.6,
"valid_targets_min": 308
},
{
"epoch": 3.259946949602122,
"grad_norm": 0.7071438987421578,
"learning_rate": 2.582729905901747e-05,
"loss": 0.4271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3176460564136505,
"step": 1845,
"valid_targets_mean": 3679.4,
"valid_targets_min": 835
},
{
"epoch": 3.268788682581786,
"grad_norm": 0.8145462041803657,
"learning_rate": 2.574294304206254e-05,
"loss": 0.4524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27845755219459534,
"step": 1850,
"valid_targets_mean": 2862.0,
"valid_targets_min": 557
},
{
"epoch": 3.27763041556145,
"grad_norm": 0.7045266012648904,
"learning_rate": 2.56584755303386e-05,
"loss": 0.4439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2471604347229004,
"step": 1855,
"valid_targets_mean": 3010.8,
"valid_targets_min": 659
},
{
"epoch": 3.286472148541114,
"grad_norm": 0.7384311436163473,
"learning_rate": 2.5573898163716663e-05,
"loss": 0.4215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20069456100463867,
"step": 1860,
"valid_targets_mean": 2391.2,
"valid_targets_min": 546
},
{
"epoch": 3.2953138815207783,
"grad_norm": 0.766502608504117,
"learning_rate": 2.5489212584200446e-05,
"loss": 0.448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2833523452281952,
"step": 1865,
"valid_targets_mean": 2948.2,
"valid_targets_min": 340
},
{
"epoch": 3.3041556145004423,
"grad_norm": 0.9146044226587593,
"learning_rate": 2.5404420435894578e-05,
"loss": 0.449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.265963613986969,
"step": 1870,
"valid_targets_mean": 2752.6,
"valid_targets_min": 587
},
{
"epoch": 3.312997347480106,
"grad_norm": 0.557404768668353,
"learning_rate": 2.5319523364972606e-05,
"loss": 0.447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22600683569908142,
"step": 1875,
"valid_targets_mean": 5350.0,
"valid_targets_min": 433
},
{
"epoch": 3.32183908045977,
"grad_norm": 0.7993682463700219,
"learning_rate": 2.5234523019645086e-05,
"loss": 0.4362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2509821057319641,
"step": 1880,
"valid_targets_mean": 2375.5,
"valid_targets_min": 605
},
{
"epoch": 3.330680813439434,
"grad_norm": 0.58659727071677,
"learning_rate": 2.5149421050127556e-05,
"loss": 0.4341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19044440984725952,
"step": 1885,
"valid_targets_mean": 4073.1,
"valid_targets_min": 1747
},
{
"epoch": 3.339522546419098,
"grad_norm": 0.7845792945000336,
"learning_rate": 2.5064219108608525e-05,
"loss": 0.4351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1808401346206665,
"step": 1890,
"valid_targets_mean": 1915.0,
"valid_targets_min": 461
},
{
"epoch": 3.348364279398762,
"grad_norm": 0.7289729636417263,
"learning_rate": 2.497891884921735e-05,
"loss": 0.4492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19839441776275635,
"step": 1895,
"valid_targets_mean": 2404.8,
"valid_targets_min": 386
},
{
"epoch": 3.357206012378426,
"grad_norm": 0.6820854233253595,
"learning_rate": 2.4893521927992182e-05,
"loss": 0.4703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27235740423202515,
"step": 1900,
"valid_targets_mean": 2999.2,
"valid_targets_min": 442
},
{
"epoch": 3.3660477453580904,
"grad_norm": 0.5855412571643762,
"learning_rate": 2.4808030002847775e-05,
"loss": 0.4376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19236628711223602,
"step": 1905,
"valid_targets_mean": 3963.6,
"valid_targets_min": 1110
},
{
"epoch": 3.3748894783377543,
"grad_norm": 0.7338094054626427,
"learning_rate": 2.472244473354332e-05,
"loss": 0.4769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22928746044635773,
"step": 1910,
"valid_targets_mean": 2708.8,
"valid_targets_min": 1158
},
{
"epoch": 3.3837312113174183,
"grad_norm": 0.7995982234481557,
"learning_rate": 2.4636767781650183e-05,
"loss": 0.4615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2549368739128113,
"step": 1915,
"valid_targets_mean": 2276.2,
"valid_targets_min": 1059
},
{
"epoch": 3.3925729442970822,
"grad_norm": 0.6376992232354394,
"learning_rate": 2.4551000810519714e-05,
"loss": 0.4899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2908145785331726,
"step": 1920,
"valid_targets_mean": 4513.8,
"valid_targets_min": 294
},
{
"epoch": 3.401414677276746,
"grad_norm": 0.7776074545649672,
"learning_rate": 2.4465145485250888e-05,
"loss": 0.4519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23057112097740173,
"step": 1925,
"valid_targets_mean": 3097.4,
"valid_targets_min": 670
},
{
"epoch": 3.41025641025641,
"grad_norm": 0.7652952479222617,
"learning_rate": 2.437920347265802e-05,
"loss": 0.4214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17387378215789795,
"step": 1930,
"valid_targets_mean": 1660.1,
"valid_targets_min": 289
},
{
"epoch": 3.419098143236074,
"grad_norm": 0.6605377290323325,
"learning_rate": 2.4293176441238396e-05,
"loss": 0.4112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23506543040275574,
"step": 1935,
"valid_targets_mean": 3702.8,
"valid_targets_min": 443
},
{
"epoch": 3.4279398762157385,
"grad_norm": 0.5979410720887383,
"learning_rate": 2.420706606113986e-05,
"loss": 0.4189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2637672424316406,
"step": 1940,
"valid_targets_mean": 4603.4,
"valid_targets_min": 673
},
{
"epoch": 3.4367816091954024,
"grad_norm": 0.5739576956888619,
"learning_rate": 2.4120874004128422e-05,
"loss": 0.4861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22790098190307617,
"step": 1945,
"valid_targets_mean": 3478.2,
"valid_targets_min": 426
},
{
"epoch": 3.4456233421750664,
"grad_norm": 0.6888223638237597,
"learning_rate": 2.4034601943555775e-05,
"loss": 0.4576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2896411418914795,
"step": 1950,
"valid_targets_mean": 3563.5,
"valid_targets_min": 296
},
{
"epoch": 3.4544650751547303,
"grad_norm": 0.6188357957447922,
"learning_rate": 2.3948251554326826e-05,
"loss": 0.4412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27495166659355164,
"step": 1955,
"valid_targets_mean": 4352.5,
"valid_targets_min": 572
},
{
"epoch": 3.4633068081343943,
"grad_norm": 0.6700510097036785,
"learning_rate": 2.3861824512867172e-05,
"loss": 0.421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3003349304199219,
"step": 1960,
"valid_targets_mean": 5187.4,
"valid_targets_min": 1645
},
{
"epoch": 3.4721485411140582,
"grad_norm": 0.6558839463348246,
"learning_rate": 2.377532249709054e-05,
"loss": 0.4557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35241687297821045,
"step": 1965,
"valid_targets_mean": 4643.0,
"valid_targets_min": 571
},
{
"epoch": 3.480990274093722,
"grad_norm": 0.6349474618857128,
"learning_rate": 2.368874718636625e-05,
"loss": 0.4472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1423875242471695,
"step": 1970,
"valid_targets_mean": 2537.1,
"valid_targets_min": 694
},
{
"epoch": 3.489832007073386,
"grad_norm": 0.6813167822681871,
"learning_rate": 2.3602100261486557e-05,
"loss": 0.4754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27694791555404663,
"step": 1975,
"valid_targets_mean": 4163.6,
"valid_targets_min": 1557
},
{
"epoch": 3.4986737400530505,
"grad_norm": 0.6514986467289062,
"learning_rate": 2.3515383404634075e-05,
"loss": 0.4378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1669061779975891,
"step": 1980,
"valid_targets_mean": 2230.2,
"valid_targets_min": 296
},
{
"epoch": 3.5075154730327145,
"grad_norm": 0.7914161143585046,
"learning_rate": 2.3428598299349076e-05,
"loss": 0.4694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27049192786216736,
"step": 1985,
"valid_targets_mean": 1989.0,
"valid_targets_min": 267
},
{
"epoch": 3.5163572060123784,
"grad_norm": 0.8656201914218805,
"learning_rate": 2.3341746630496828e-05,
"loss": 0.4454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25898832082748413,
"step": 1990,
"valid_targets_mean": 1998.6,
"valid_targets_min": 734
},
{
"epoch": 3.5251989389920424,
"grad_norm": 0.7646102018521315,
"learning_rate": 2.3254830084234877e-05,
"loss": 0.4168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21087685227394104,
"step": 1995,
"valid_targets_mean": 3901.9,
"valid_targets_min": 1727
},
{
"epoch": 3.5340406719717063,
"grad_norm": 0.7970932854441665,
"learning_rate": 2.316785034798032e-05,
"loss": 0.4506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.256100058555603,
"step": 2000,
"valid_targets_mean": 2907.2,
"valid_targets_min": 1306
},
{
"epoch": 3.5428824049513707,
"grad_norm": 0.7147517419674159,
"learning_rate": 2.308080911037703e-05,
"loss": 0.4358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2644729018211365,
"step": 2005,
"valid_targets_mean": 3793.5,
"valid_targets_min": 1606
},
{
"epoch": 3.5517241379310347,
"grad_norm": 0.6331675123587539,
"learning_rate": 2.2993708061262886e-05,
"loss": 0.458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1513529121875763,
"step": 2010,
"valid_targets_mean": 2805.9,
"valid_targets_min": 1291
},
{
"epoch": 3.5605658709106986,
"grad_norm": 0.7549622939379798,
"learning_rate": 2.2906548891636956e-05,
"loss": 0.4567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24897724390029907,
"step": 2015,
"valid_targets_mean": 2534.6,
"valid_targets_min": 1037
},
{
"epoch": 3.5694076038903626,
"grad_norm": 0.9923863265222221,
"learning_rate": 2.2819333293626686e-05,
"loss": 0.4483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16775819659233093,
"step": 2020,
"valid_targets_mean": 1303.4,
"valid_targets_min": 324
},
{
"epoch": 3.5782493368700266,
"grad_norm": 0.6137184109496221,
"learning_rate": 2.2732062960455014e-05,
"loss": 0.4373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15827752649784088,
"step": 2025,
"valid_targets_mean": 3152.2,
"valid_targets_min": 308
},
{
"epoch": 3.5870910698496905,
"grad_norm": 0.7316389088145041,
"learning_rate": 2.264473958640753e-05,
"loss": 0.412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19498181343078613,
"step": 2030,
"valid_targets_mean": 2589.9,
"valid_targets_min": 411
},
{
"epoch": 3.5959328028293545,
"grad_norm": 0.7269422076299851,
"learning_rate": 2.2557364866799572e-05,
"loss": 0.4285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3297356367111206,
"step": 2035,
"valid_targets_mean": 3257.0,
"valid_targets_min": 461
},
{
"epoch": 3.6047745358090184,
"grad_norm": 0.6557829256691635,
"learning_rate": 2.246994049794332e-05,
"loss": 0.4663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11620749533176422,
"step": 2040,
"valid_targets_mean": 2108.5,
"valid_targets_min": 1626
},
{
"epoch": 3.6136162687886824,
"grad_norm": 0.6578106972416874,
"learning_rate": 2.2382468177114834e-05,
"loss": 0.4001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1800394058227539,
"step": 2045,
"valid_targets_mean": 2848.1,
"valid_targets_min": 491
},
{
"epoch": 3.6224580017683468,
"grad_norm": 0.6460106377859882,
"learning_rate": 2.2294949602521142e-05,
"loss": 0.4664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20682604610919952,
"step": 2050,
"valid_targets_mean": 3096.0,
"valid_targets_min": 401
},
{
"epoch": 3.6312997347480107,
"grad_norm": 0.7686693214243684,
"learning_rate": 2.2207386473267247e-05,
"loss": 0.4407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2174399495124817,
"step": 2055,
"valid_targets_mean": 2397.0,
"valid_targets_min": 638
},
{
"epoch": 3.6401414677276747,
"grad_norm": 0.7189899231337926,
"learning_rate": 2.2119780489323154e-05,
"loss": 0.4363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19445934891700745,
"step": 2060,
"valid_targets_mean": 2458.8,
"valid_targets_min": 990
},
{
"epoch": 3.6489832007073386,
"grad_norm": 0.7020436393545836,
"learning_rate": 2.2032133351490835e-05,
"loss": 0.4571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30607905983924866,
"step": 2065,
"valid_targets_mean": 3775.8,
"valid_targets_min": 1317
},
{
"epoch": 3.6578249336870026,
"grad_norm": 0.7444068107077655,
"learning_rate": 2.1944446761371264e-05,
"loss": 0.4217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22787776589393616,
"step": 2070,
"valid_targets_mean": 2930.4,
"valid_targets_min": 1730
},
{
"epoch": 3.6666666666666665,
"grad_norm": 0.6968317634420128,
"learning_rate": 2.1856722421331322e-05,
"loss": 0.444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15648722648620605,
"step": 2075,
"valid_targets_mean": 2251.6,
"valid_targets_min": 350
},
{
"epoch": 3.675508399646331,
"grad_norm": 0.6959983172874498,
"learning_rate": 2.1768962034470803e-05,
"loss": 0.4696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24266773462295532,
"step": 2080,
"valid_targets_mean": 3423.4,
"valid_targets_min": 384
},
{
"epoch": 3.684350132625995,
"grad_norm": 0.7788541548960379,
"learning_rate": 2.1681167304589295e-05,
"loss": 0.4074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1628911793231964,
"step": 2085,
"valid_targets_mean": 2365.0,
"valid_targets_min": 461
},
{
"epoch": 3.693191865605659,
"grad_norm": 0.7039562542774168,
"learning_rate": 2.1593339936153148e-05,
"loss": 0.424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17437390983104706,
"step": 2090,
"valid_targets_mean": 2311.9,
"valid_targets_min": 1444
},
{
"epoch": 3.7020335985853228,
"grad_norm": 0.5741843896967402,
"learning_rate": 2.1505481634262354e-05,
"loss": 0.4053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22777321934700012,
"step": 2095,
"valid_targets_mean": 4313.0,
"valid_targets_min": 1591
},
{
"epoch": 3.7108753315649867,
"grad_norm": 0.7672460830420991,
"learning_rate": 2.141759410461746e-05,
"loss": 0.4182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1350998878479004,
"step": 2100,
"valid_targets_mean": 1726.9,
"valid_targets_min": 382
},
{
"epoch": 3.7197170645446507,
"grad_norm": 0.6710207783728802,
"learning_rate": 2.1329679053486444e-05,
"loss": 0.4478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29351454973220825,
"step": 2105,
"valid_targets_mean": 3874.4,
"valid_targets_min": 1654
},
{
"epoch": 3.7285587975243146,
"grad_norm": 0.6423318027598373,
"learning_rate": 2.1241738187671595e-05,
"loss": 0.4299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19800537824630737,
"step": 2110,
"valid_targets_mean": 2980.0,
"valid_targets_min": 1460
},
{
"epoch": 3.7374005305039786,
"grad_norm": 0.6914935831642892,
"learning_rate": 2.115377321447637e-05,
"loss": 0.4992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1961551457643509,
"step": 2115,
"valid_targets_mean": 3261.6,
"valid_targets_min": 1418
},
{
"epoch": 3.7462422634836425,
"grad_norm": 0.6625084903349797,
"learning_rate": 2.106578584167225e-05,
"loss": 0.4114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2027662992477417,
"step": 2120,
"valid_targets_mean": 2802.2,
"valid_targets_min": 610
},
{
"epoch": 3.755083996463307,
"grad_norm": 0.644453283873008,
"learning_rate": 2.0977777777465594e-05,
"loss": 0.4229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17548662424087524,
"step": 2125,
"valid_targets_mean": 3109.0,
"valid_targets_min": 714
},
{
"epoch": 3.763925729442971,
"grad_norm": 0.7667734390353328,
"learning_rate": 2.0889750730464474e-05,
"loss": 0.4612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23370791971683502,
"step": 2130,
"valid_targets_mean": 2261.5,
"valid_targets_min": 598
},
{
"epoch": 3.772767462422635,
"grad_norm": 0.738277857442572,
"learning_rate": 2.0801706409645473e-05,
"loss": 0.4607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21809722483158112,
"step": 2135,
"valid_targets_mean": 3180.4,
"valid_targets_min": 682
},
{
"epoch": 3.781609195402299,
"grad_norm": 0.8463179804355774,
"learning_rate": 2.0713646524320557e-05,
"loss": 0.4408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22101402282714844,
"step": 2140,
"valid_targets_mean": 2733.5,
"valid_targets_min": 477
},
{
"epoch": 3.7904509283819627,
"grad_norm": 0.7086110797536909,
"learning_rate": 2.0625572784103855e-05,
"loss": 0.471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23744723200798035,
"step": 2145,
"valid_targets_mean": 2938.8,
"valid_targets_min": 350
},
{
"epoch": 3.799292661361627,
"grad_norm": 0.6251176123735659,
"learning_rate": 2.053748689887848e-05,
"loss": 0.4261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20360612869262695,
"step": 2150,
"valid_targets_mean": 3229.5,
"valid_targets_min": 844
},
{
"epoch": 3.808134394341291,
"grad_norm": 0.6958759696778948,
"learning_rate": 2.0449390578763336e-05,
"loss": 0.4283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2020493447780609,
"step": 2155,
"valid_targets_mean": 2590.4,
"valid_targets_min": 420
},
{
"epoch": 3.816976127320955,
"grad_norm": 0.7006461931706444,
"learning_rate": 2.036128553407989e-05,
"loss": 0.4411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2114584743976593,
"step": 2160,
"valid_targets_mean": 2864.6,
"valid_targets_min": 616
},
{
"epoch": 3.825817860300619,
"grad_norm": 0.6980121359538078,
"learning_rate": 2.027317347531902e-05,
"loss": 0.4583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2123686671257019,
"step": 2165,
"valid_targets_mean": 3107.0,
"valid_targets_min": 1375
},
{
"epoch": 3.834659593280283,
"grad_norm": 0.7098528867513164,
"learning_rate": 2.0185056113107763e-05,
"loss": 0.495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23799559473991394,
"step": 2170,
"valid_targets_mean": 3973.5,
"valid_targets_min": 1517
},
{
"epoch": 3.843501326259947,
"grad_norm": 0.9443823890149703,
"learning_rate": 2.0096935158176105e-05,
"loss": 0.434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21758808195590973,
"step": 2175,
"valid_targets_mean": 1717.0,
"valid_targets_min": 343
},
{
"epoch": 3.852343059239611,
"grad_norm": 0.8056251979105057,
"learning_rate": 2.000881232132381e-05,
"loss": 0.4657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17145347595214844,
"step": 2180,
"valid_targets_mean": 1844.9,
"valid_targets_min": 606
},
{
"epoch": 3.861184792219275,
"grad_norm": 0.631753151558534,
"learning_rate": 1.9920689313387148e-05,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23968084156513214,
"step": 2185,
"valid_targets_mean": 4621.9,
"valid_targets_min": 1216
},
{
"epoch": 3.8700265251989387,
"grad_norm": 0.5921935896404549,
"learning_rate": 1.9832567845205735e-05,
"loss": 0.4161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23088482022285461,
"step": 2190,
"valid_targets_mean": 4285.4,
"valid_targets_min": 363
},
{
"epoch": 3.878868258178603,
"grad_norm": 0.6575693180610859,
"learning_rate": 1.974444962758929e-05,
"loss": 0.4294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.220181405544281,
"step": 2195,
"valid_targets_mean": 3333.4,
"valid_targets_min": 1980
},
{
"epoch": 3.887709991158267,
"grad_norm": 0.6941860616336191,
"learning_rate": 1.9656336371284406e-05,
"loss": 0.4552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22298529744148254,
"step": 2200,
"valid_targets_mean": 2727.5,
"valid_targets_min": 601
},
{
"epoch": 3.896551724137931,
"grad_norm": 0.7225249260002937,
"learning_rate": 1.956822978694137e-05,
"loss": 0.4438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18556898832321167,
"step": 2205,
"valid_targets_mean": 2341.8,
"valid_targets_min": 442
},
{
"epoch": 3.905393457117595,
"grad_norm": 0.7406697584636266,
"learning_rate": 1.9480131585080946e-05,
"loss": 0.4231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2133459746837616,
"step": 2210,
"valid_targets_mean": 2642.8,
"valid_targets_min": 431
},
{
"epoch": 3.914235190097259,
"grad_norm": 0.7039889962915561,
"learning_rate": 1.939204347606115e-05,
"loss": 0.4493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2137300670146942,
"step": 2215,
"valid_targets_mean": 2678.2,
"valid_targets_min": 1169
},
{
"epoch": 3.9230769230769234,
"grad_norm": 0.634420740737628,
"learning_rate": 1.9303967170044043e-05,
"loss": 0.4358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17572371661663055,
"step": 2220,
"valid_targets_mean": 3010.6,
"valid_targets_min": 1313
},
{
"epoch": 3.9319186560565873,
"grad_norm": 0.7155018581712755,
"learning_rate": 1.9215904376962555e-05,
"loss": 0.4263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21080003678798676,
"step": 2225,
"valid_targets_mean": 2322.0,
"valid_targets_min": 742
},
{
"epoch": 3.9407603890362513,
"grad_norm": 0.758819158514058,
"learning_rate": 1.9127856806487266e-05,
"loss": 0.4388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16472750902175903,
"step": 2230,
"valid_targets_mean": 2019.2,
"valid_targets_min": 431
},
{
"epoch": 3.949602122015915,
"grad_norm": 0.8777006692099467,
"learning_rate": 1.9039826167993235e-05,
"loss": 0.4483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17932608723640442,
"step": 2235,
"valid_targets_mean": 1764.1,
"valid_targets_min": 682
},
{
"epoch": 3.958443854995579,
"grad_norm": 0.6089818772904589,
"learning_rate": 1.895181417052677e-05,
"loss": 0.4231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24629013240337372,
"step": 2240,
"valid_targets_mean": 4223.6,
"valid_targets_min": 459
},
{
"epoch": 3.967285587975243,
"grad_norm": 0.639631153985411,
"learning_rate": 1.88638225227723e-05,
"loss": 0.4245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21447336673736572,
"step": 2245,
"valid_targets_mean": 3402.6,
"valid_targets_min": 424
},
{
"epoch": 3.976127320954907,
"grad_norm": 0.8458138613793146,
"learning_rate": 1.877585293301918e-05,
"loss": 0.4163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22714388370513916,
"step": 2250,
"valid_targets_mean": 2087.0,
"valid_targets_min": 488
},
{
"epoch": 3.984969053934571,
"grad_norm": 0.8014506952688943,
"learning_rate": 1.868790710912853e-05,
"loss": 0.4301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27369236946105957,
"step": 2255,
"valid_targets_mean": 2659.0,
"valid_targets_min": 1183
},
{
"epoch": 3.993810786914235,
"grad_norm": 0.5931369878866818,
"learning_rate": 1.8599986758500047e-05,
"loss": 0.4667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2135334014892578,
"step": 2260,
"valid_targets_mean": 3793.0,
"valid_targets_min": 765
},
{
"epoch": 4.001768346595933,
"grad_norm": 0.6460139121405902,
"learning_rate": 1.8512093588038915e-05,
"loss": 0.4144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2704264223575592,
"step": 2265,
"valid_targets_mean": 4983.9,
"valid_targets_min": 244
},
{
"epoch": 4.010610079575597,
"grad_norm": 0.7103598023526009,
"learning_rate": 1.842422930412262e-05,
"loss": 0.4182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22416162490844727,
"step": 2270,
"valid_targets_mean": 3300.9,
"valid_targets_min": 1126
},
{
"epoch": 4.0194518125552605,
"grad_norm": 0.6926185487221391,
"learning_rate": 1.8336395612567857e-05,
"loss": 0.4081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19507721066474915,
"step": 2275,
"valid_targets_mean": 3702.0,
"valid_targets_min": 308
},
{
"epoch": 4.0282935455349245,
"grad_norm": 0.6966627277554577,
"learning_rate": 1.824859421859736e-05,
"loss": 0.4291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2344420850276947,
"step": 2280,
"valid_targets_mean": 3541.6,
"valid_targets_min": 532
},
{
"epoch": 4.037135278514588,
"grad_norm": 0.8185873096759235,
"learning_rate": 1.8160826826806856e-05,
"loss": 0.4333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16348719596862793,
"step": 2285,
"valid_targets_mean": 1622.6,
"valid_targets_min": 345
},
{
"epoch": 4.045977011494253,
"grad_norm": 0.6298356213417173,
"learning_rate": 1.8073095141131946e-05,
"loss": 0.3803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15070627629756927,
"step": 2290,
"valid_targets_mean": 4094.2,
"valid_targets_min": 411
},
{
"epoch": 4.054818744473917,
"grad_norm": 0.7055842030089096,
"learning_rate": 1.7985400864815027e-05,
"loss": 0.4017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1813596785068512,
"step": 2295,
"valid_targets_mean": 2406.0,
"valid_targets_min": 429
},
{
"epoch": 4.063660477453581,
"grad_norm": 0.6605651518692166,
"learning_rate": 1.7897745700372194e-05,
"loss": 0.403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19027772545814514,
"step": 2300,
"valid_targets_mean": 3733.2,
"valid_targets_min": 558
},
{
"epoch": 4.072502210433245,
"grad_norm": 0.638116942250368,
"learning_rate": 1.781013134956025e-05,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1789359450340271,
"step": 2305,
"valid_targets_mean": 4052.6,
"valid_targets_min": 1744
},
{
"epoch": 4.081343943412909,
"grad_norm": 0.6312271133669283,
"learning_rate": 1.7722559513343616e-05,
"loss": 0.4298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18907594680786133,
"step": 2310,
"valid_targets_mean": 4083.4,
"valid_targets_min": 312
},
{
"epoch": 4.090185676392573,
"grad_norm": 0.6831522353731495,
"learning_rate": 1.7635031891861334e-05,
"loss": 0.4048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2140839397907257,
"step": 2315,
"valid_targets_mean": 3038.2,
"valid_targets_min": 653
},
{
"epoch": 4.099027409372237,
"grad_norm": 0.7541794171611146,
"learning_rate": 1.7547550184394036e-05,
"loss": 0.3999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14385363459587097,
"step": 2320,
"valid_targets_mean": 1814.5,
"valid_targets_min": 392
},
{
"epoch": 4.107869142351901,
"grad_norm": 0.850080748839246,
"learning_rate": 1.746011608933098e-05,
"loss": 0.4263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1753498613834381,
"step": 2325,
"valid_targets_mean": 2009.9,
"valid_targets_min": 260
},
{
"epoch": 4.116710875331565,
"grad_norm": 0.6727035464038962,
"learning_rate": 1.7372731304137072e-05,
"loss": 0.4234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.156248539686203,
"step": 2330,
"valid_targets_mean": 2836.2,
"valid_targets_min": 1037
},
{
"epoch": 4.125552608311229,
"grad_norm": 0.7915258988052476,
"learning_rate": 1.7285397525319897e-05,
"loss": 0.4209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18911907076835632,
"step": 2335,
"valid_targets_mean": 2722.6,
"valid_targets_min": 558
},
{
"epoch": 4.134394341290893,
"grad_norm": 0.7225681941913896,
"learning_rate": 1.719811644839679e-05,
"loss": 0.4446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2196042686700821,
"step": 2340,
"valid_targets_mean": 2874.2,
"valid_targets_min": 1010
},
{
"epoch": 4.143236074270557,
"grad_norm": 0.6793110061906088,
"learning_rate": 1.711088976786192e-05,
"loss": 0.4049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22990606725215912,
"step": 2345,
"valid_targets_mean": 3720.2,
"valid_targets_min": 1376
},
{
"epoch": 4.152077807250221,
"grad_norm": 0.6309626795534368,
"learning_rate": 1.7023719177153397e-05,
"loss": 0.4287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25914740562438965,
"step": 2350,
"valid_targets_mean": 5181.9,
"valid_targets_min": 365
},
{
"epoch": 4.160919540229885,
"grad_norm": 0.7534348626475472,
"learning_rate": 1.6936606368620393e-05,
"loss": 0.426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30650636553764343,
"step": 2355,
"valid_targets_mean": 3284.2,
"valid_targets_min": 1120
},
{
"epoch": 4.1697612732095495,
"grad_norm": 0.7973625055634738,
"learning_rate": 1.684955303349027e-05,
"loss": 0.4116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11398676037788391,
"step": 2360,
"valid_targets_mean": 1583.0,
"valid_targets_min": 341
},
{
"epoch": 4.178603006189213,
"grad_norm": 0.6773926752150286,
"learning_rate": 1.6762560861835778e-05,
"loss": 0.3691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13966532051563263,
"step": 2365,
"valid_targets_mean": 2208.0,
"valid_targets_min": 1095
},
{
"epoch": 4.187444739168877,
"grad_norm": 0.7600418307606107,
"learning_rate": 1.6675631542542206e-05,
"loss": 0.4199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1887199878692627,
"step": 2370,
"valid_targets_mean": 2575.6,
"valid_targets_min": 1492
},
{
"epoch": 4.196286472148541,
"grad_norm": 0.825716048698755,
"learning_rate": 1.658876676327464e-05,
"loss": 0.4325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17904534935951233,
"step": 2375,
"valid_targets_mean": 1817.2,
"valid_targets_min": 509
},
{
"epoch": 4.205128205128205,
"grad_norm": 0.7357744240798385,
"learning_rate": 1.6501968210445144e-05,
"loss": 0.433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28740018606185913,
"step": 2380,
"valid_targets_mean": 3760.6,
"valid_targets_min": 2060
},
{
"epoch": 4.213969938107869,
"grad_norm": 0.6102035784766663,
"learning_rate": 1.641523756918006e-05,
"loss": 0.4051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19327875971794128,
"step": 2385,
"valid_targets_mean": 4250.9,
"valid_targets_min": 1501
},
{
"epoch": 4.222811671087533,
"grad_norm": 0.6953359184280162,
"learning_rate": 1.6328576523287284e-05,
"loss": 0.4268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.310172438621521,
"step": 2390,
"valid_targets_mean": 4208.6,
"valid_targets_min": 1314
},
{
"epoch": 4.231653404067197,
"grad_norm": 0.7297311607993835,
"learning_rate": 1.6241986755223574e-05,
"loss": 0.4281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32732078433036804,
"step": 2395,
"valid_targets_mean": 3946.0,
"valid_targets_min": 421
},
{
"epoch": 4.240495137046861,
"grad_norm": 0.7130243864792679,
"learning_rate": 1.6155469946061863e-05,
"loss": 0.3957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1902158409357071,
"step": 2400,
"valid_targets_mean": 3486.8,
"valid_targets_min": 1190
},
{
"epoch": 4.249336870026525,
"grad_norm": 0.7379540908447911,
"learning_rate": 1.6069027775458665e-05,
"loss": 0.4381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1608520746231079,
"step": 2405,
"valid_targets_mean": 2679.8,
"valid_targets_min": 1319
},
{
"epoch": 4.258178603006189,
"grad_norm": 0.8452056516818466,
"learning_rate": 1.5982661921621437e-05,
"loss": 0.4092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23513582348823547,
"step": 2410,
"valid_targets_mean": 2361.6,
"valid_targets_min": 426
},
{
"epoch": 4.267020335985853,
"grad_norm": 0.730287777008674,
"learning_rate": 1.5896374061276015e-05,
"loss": 0.4286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2784014344215393,
"step": 2415,
"valid_targets_mean": 5109.2,
"valid_targets_min": 1990
},
{
"epoch": 4.275862068965517,
"grad_norm": 0.7103251487687208,
"learning_rate": 1.5810165869634027e-05,
"loss": 0.4031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2809576392173767,
"step": 2420,
"valid_targets_mean": 5307.9,
"valid_targets_min": 900
},
{
"epoch": 4.284703801945181,
"grad_norm": 0.6866454436464177,
"learning_rate": 1.572403902036042e-05,
"loss": 0.4139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1964649111032486,
"step": 2425,
"valid_targets_mean": 2979.6,
"valid_targets_min": 1814
},
{
"epoch": 4.293545534924846,
"grad_norm": 0.7150372488857892,
"learning_rate": 1.5637995185540932e-05,
"loss": 0.3881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1866159737110138,
"step": 2430,
"valid_targets_mean": 3078.5,
"valid_targets_min": 1192
},
{
"epoch": 4.30238726790451,
"grad_norm": 0.8579495181131218,
"learning_rate": 1.5552036035649656e-05,
"loss": 0.4188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.200179323554039,
"step": 2435,
"valid_targets_mean": 2049.5,
"valid_targets_min": 523
},
{
"epoch": 4.311229000884174,
"grad_norm": 0.7013758701584984,
"learning_rate": 1.5466163239516553e-05,
"loss": 0.3927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30045637488365173,
"step": 2440,
"valid_targets_mean": 3139.2,
"valid_targets_min": 453
},
{
"epoch": 4.3200707338638376,
"grad_norm": 0.7497089575459133,
"learning_rate": 1.5380378464295133e-05,
"loss": 0.3999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16102385520935059,
"step": 2445,
"valid_targets_mean": 2777.8,
"valid_targets_min": 673
},
{
"epoch": 4.3289124668435015,
"grad_norm": 0.7738772317856076,
"learning_rate": 1.5294683375430035e-05,
"loss": 0.45,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24177439510822296,
"step": 2450,
"valid_targets_mean": 3024.8,
"valid_targets_min": 403
},
{
"epoch": 4.3377541998231655,
"grad_norm": 0.8087896123657419,
"learning_rate": 1.520907963662471e-05,
"loss": 0.398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17100030183792114,
"step": 2455,
"valid_targets_mean": 1706.0,
"valid_targets_min": 503
},
{
"epoch": 4.346595932802829,
"grad_norm": 0.6521224471842675,
"learning_rate": 1.5123568909809103e-05,
"loss": 0.3993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21314716339111328,
"step": 2460,
"valid_targets_mean": 4596.2,
"valid_targets_min": 1946
},
{
"epoch": 4.355437665782493,
"grad_norm": 0.6730460262609402,
"learning_rate": 1.5038152855107422e-05,
"loss": 0.4331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29492098093032837,
"step": 2465,
"valid_targets_mean": 4156.1,
"valid_targets_min": 286
},
{
"epoch": 4.364279398762157,
"grad_norm": 0.8227541669467124,
"learning_rate": 1.4952833130805884e-05,
"loss": 0.4228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20231404900550842,
"step": 2470,
"valid_targets_mean": 2325.4,
"valid_targets_min": 1373
},
{
"epoch": 4.373121131741821,
"grad_norm": 0.6978839330328747,
"learning_rate": 1.4867611393320533e-05,
"loss": 0.4432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23436486721038818,
"step": 2475,
"valid_targets_mean": 3332.9,
"valid_targets_min": 317
},
{
"epoch": 4.381962864721485,
"grad_norm": 0.7946215788236765,
"learning_rate": 1.478248929716505e-05,
"loss": 0.3911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1627664864063263,
"step": 2480,
"valid_targets_mean": 1966.0,
"valid_targets_min": 856
},
{
"epoch": 4.390804597701149,
"grad_norm": 0.7156697773599238,
"learning_rate": 1.4697468494918687e-05,
"loss": 0.4436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.186476469039917,
"step": 2485,
"valid_targets_mean": 2992.4,
"valid_targets_min": 607
},
{
"epoch": 4.399646330680813,
"grad_norm": 0.8727002600998265,
"learning_rate": 1.4612550637194141e-05,
"loss": 0.4475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19441717863082886,
"step": 2490,
"valid_targets_mean": 2303.6,
"valid_targets_min": 708
},
{
"epoch": 4.408488063660477,
"grad_norm": 0.7507265043943055,
"learning_rate": 1.4527737372605529e-05,
"loss": 0.4507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23913750052452087,
"step": 2495,
"valid_targets_mean": 3582.6,
"valid_targets_min": 1482
},
{
"epoch": 4.417329796640141,
"grad_norm": 0.7610940521640887,
"learning_rate": 1.4443030347736347e-05,
"loss": 0.4381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1793220490217209,
"step": 2500,
"valid_targets_mean": 2593.2,
"valid_targets_min": 267
},
{
"epoch": 4.426171529619806,
"grad_norm": 0.6342963620181833,
"learning_rate": 1.435843120710756e-05,
"loss": 0.4017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20556139945983887,
"step": 2505,
"valid_targets_mean": 4132.1,
"valid_targets_min": 1120
},
{
"epoch": 4.43501326259947,
"grad_norm": 0.7530536406998339,
"learning_rate": 1.4273941593145636e-05,
"loss": 0.4483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38451525568962097,
"step": 2510,
"valid_targets_mean": 4499.5,
"valid_targets_min": 1789
},
{
"epoch": 4.443854995579134,
"grad_norm": 0.8273793851318227,
"learning_rate": 1.4189563146150669e-05,
"loss": 0.4212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20944646000862122,
"step": 2515,
"valid_targets_mean": 2535.8,
"valid_targets_min": 623
},
{
"epoch": 4.452696728558798,
"grad_norm": 0.7909970336145224,
"learning_rate": 1.4105297504264516e-05,
"loss": 0.4347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3092140555381775,
"step": 2520,
"valid_targets_mean": 3188.4,
"valid_targets_min": 1031
},
{
"epoch": 4.461538461538462,
"grad_norm": 0.9428226334726033,
"learning_rate": 1.4021146303439031e-05,
"loss": 0.4029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2530262768268585,
"step": 2525,
"valid_targets_mean": 2076.4,
"valid_targets_min": 349
},
{
"epoch": 4.470380194518126,
"grad_norm": 0.7317845516311463,
"learning_rate": 1.3937111177404279e-05,
"loss": 0.4369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24385397136211395,
"step": 2530,
"valid_targets_mean": 3438.1,
"valid_targets_min": 1464
},
{
"epoch": 4.47922192749779,
"grad_norm": 0.7770528449780305,
"learning_rate": 1.385319375763682e-05,
"loss": 0.3756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17684635519981384,
"step": 2535,
"valid_targets_mean": 2598.0,
"valid_targets_min": 227
},
{
"epoch": 4.4880636604774535,
"grad_norm": 0.7420657248975656,
"learning_rate": 1.376939567332804e-05,
"loss": 0.4351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18782931566238403,
"step": 2540,
"valid_targets_mean": 2944.4,
"valid_targets_min": 1125
},
{
"epoch": 4.4969053934571175,
"grad_norm": 1.0340838110233663,
"learning_rate": 1.3685718551352518e-05,
"loss": 0.4428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.160398930311203,
"step": 2545,
"valid_targets_mean": 3630.4,
"valid_targets_min": 1189
},
{
"epoch": 4.505747126436781,
"grad_norm": 0.6091047868776585,
"learning_rate": 1.3602164016236444e-05,
"loss": 0.4019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1208481639623642,
"step": 2550,
"valid_targets_mean": 2871.2,
"valid_targets_min": 301
},
{
"epoch": 4.514588859416445,
"grad_norm": 0.7276768828189113,
"learning_rate": 1.3518733690126084e-05,
"loss": 0.4236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21554812788963318,
"step": 2555,
"valid_targets_mean": 3198.2,
"valid_targets_min": 308
},
{
"epoch": 4.523430592396109,
"grad_norm": 0.8138197550507267,
"learning_rate": 1.3435429192756275e-05,
"loss": 0.388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15686780214309692,
"step": 2560,
"valid_targets_mean": 1802.8,
"valid_targets_min": 391
},
{
"epoch": 4.532272325375773,
"grad_norm": 0.7698296993001761,
"learning_rate": 1.3352252141418998e-05,
"loss": 0.4202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21974670886993408,
"step": 2565,
"valid_targets_mean": 2627.8,
"valid_targets_min": 1299
},
{
"epoch": 4.541114058355438,
"grad_norm": 0.6991515960307244,
"learning_rate": 1.3269204150931953e-05,
"loss": 0.4112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1762574017047882,
"step": 2570,
"valid_targets_mean": 2943.6,
"valid_targets_min": 409
},
{
"epoch": 4.549955791335101,
"grad_norm": 0.5961797549163438,
"learning_rate": 1.3186286833607244e-05,
"loss": 0.4039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24313318729400635,
"step": 2575,
"valid_targets_mean": 4766.8,
"valid_targets_min": 662
},
{
"epoch": 4.558797524314766,
"grad_norm": 0.7490840636312823,
"learning_rate": 1.3103501799220033e-05,
"loss": 0.4085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23084694147109985,
"step": 2580,
"valid_targets_mean": 4158.1,
"valid_targets_min": 1584
},
{
"epoch": 4.56763925729443,
"grad_norm": 0.7065075883727937,
"learning_rate": 1.3020850654977333e-05,
"loss": 0.4209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1791738122701645,
"step": 2585,
"valid_targets_mean": 2766.2,
"valid_targets_min": 294
},
{
"epoch": 4.576480990274094,
"grad_norm": 0.6016645740317225,
"learning_rate": 1.293833500548678e-05,
"loss": 0.4446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17156481742858887,
"step": 2590,
"valid_targets_mean": 3903.5,
"valid_targets_min": 1670
},
{
"epoch": 4.585322723253758,
"grad_norm": 0.6114926043432934,
"learning_rate": 1.2855956452725471e-05,
"loss": 0.3752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23596268892288208,
"step": 2595,
"valid_targets_mean": 3700.5,
"valid_targets_min": 682
},
{
"epoch": 4.594164456233422,
"grad_norm": 0.7917827130664251,
"learning_rate": 1.2773716596008889e-05,
"loss": 0.3987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21856589615345,
"step": 2600,
"valid_targets_mean": 3063.4,
"valid_targets_min": 844
},
{
"epoch": 4.603006189213086,
"grad_norm": 0.648273474654547,
"learning_rate": 1.2691617031959843e-05,
"loss": 0.4105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17004728317260742,
"step": 2605,
"valid_targets_mean": 3463.0,
"valid_targets_min": 1261
},
{
"epoch": 4.61184792219275,
"grad_norm": 0.8189757224237537,
"learning_rate": 1.2609659354477458e-05,
"loss": 0.4349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3089355528354645,
"step": 2610,
"valid_targets_mean": 3244.4,
"valid_targets_min": 776
},
{
"epoch": 4.620689655172414,
"grad_norm": 0.7858403164318954,
"learning_rate": 1.2527845154706264e-05,
"loss": 0.3781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20955795049667358,
"step": 2615,
"valid_targets_mean": 3477.9,
"valid_targets_min": 906
},
{
"epoch": 4.629531388152078,
"grad_norm": 0.6689115673937959,
"learning_rate": 1.2446176021005245e-05,
"loss": 0.4202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19080306589603424,
"step": 2620,
"valid_targets_mean": 3002.6,
"valid_targets_min": 285
},
{
"epoch": 4.638373121131742,
"grad_norm": 0.6541092626716796,
"learning_rate": 1.2364653538917076e-05,
"loss": 0.4161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25211408734321594,
"step": 2625,
"valid_targets_mean": 5283.1,
"valid_targets_min": 593
},
{
"epoch": 4.647214854111406,
"grad_norm": 0.6591383126713584,
"learning_rate": 1.2283279291137291e-05,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23830297589302063,
"step": 2630,
"valid_targets_mean": 4273.6,
"valid_targets_min": 2174
},
{
"epoch": 4.6560565870910695,
"grad_norm": 0.6424277501690692,
"learning_rate": 1.2202054857483576e-05,
"loss": 0.4014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27352088689804077,
"step": 2635,
"valid_targets_mean": 4946.4,
"valid_targets_min": 1302
},
{
"epoch": 4.6648983200707335,
"grad_norm": 0.7211760280647633,
"learning_rate": 1.2120981814865073e-05,
"loss": 0.4114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23283889889717102,
"step": 2640,
"valid_targets_mean": 3097.9,
"valid_targets_min": 392
},
{
"epoch": 4.673740053050398,
"grad_norm": 0.7571275814501419,
"learning_rate": 1.2040061737251807e-05,
"loss": 0.4629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3724607229232788,
"step": 2645,
"valid_targets_mean": 3724.1,
"valid_targets_min": 1291
},
{
"epoch": 4.682581786030062,
"grad_norm": 0.6466326044624365,
"learning_rate": 1.19592961956441e-05,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22775639593601227,
"step": 2650,
"valid_targets_mean": 4530.5,
"valid_targets_min": 1760
},
{
"epoch": 4.691423519009726,
"grad_norm": 0.731960782868472,
"learning_rate": 1.1878686758042086e-05,
"loss": 0.4552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20677362382411957,
"step": 2655,
"valid_targets_mean": 2433.1,
"valid_targets_min": 1698
},
{
"epoch": 4.70026525198939,
"grad_norm": 0.6658248910649158,
"learning_rate": 1.179823498941523e-05,
"loss": 0.4191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20261318981647491,
"step": 2660,
"valid_targets_mean": 3311.1,
"valid_targets_min": 1568
},
{
"epoch": 4.709106984969054,
"grad_norm": 0.7076657293158575,
"learning_rate": 1.1717942451672008e-05,
"loss": 0.4428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2810763120651245,
"step": 2665,
"valid_targets_mean": 4327.8,
"valid_targets_min": 1118
},
{
"epoch": 4.717948717948718,
"grad_norm": 0.7884816045404514,
"learning_rate": 1.1637810703629549e-05,
"loss": 0.4001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21002733707427979,
"step": 2670,
"valid_targets_mean": 2842.2,
"valid_targets_min": 715
},
{
"epoch": 4.726790450928382,
"grad_norm": 0.7169004560389791,
"learning_rate": 1.1557841300983363e-05,
"loss": 0.4537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17877726256847382,
"step": 2675,
"valid_targets_mean": 2562.5,
"valid_targets_min": 643
},
{
"epoch": 4.735632183908046,
"grad_norm": 0.5669741728591965,
"learning_rate": 1.1478035796277158e-05,
"loss": 0.4426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10677316039800644,
"step": 2680,
"valid_targets_mean": 2404.2,
"valid_targets_min": 1020
},
{
"epoch": 4.74447391688771,
"grad_norm": 0.7657675790094381,
"learning_rate": 1.1398395738872683e-05,
"loss": 0.422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1494864672422409,
"step": 2685,
"valid_targets_mean": 2797.8,
"valid_targets_min": 818
},
{
"epoch": 4.753315649867374,
"grad_norm": 0.6799388910970321,
"learning_rate": 1.1318922674919675e-05,
"loss": 0.4646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2254074662923813,
"step": 2690,
"valid_targets_mean": 3502.0,
"valid_targets_min": 880
},
{
"epoch": 4.762157382847038,
"grad_norm": 0.7628855637000989,
"learning_rate": 1.1239618147325802e-05,
"loss": 0.3928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2163882851600647,
"step": 2695,
"valid_targets_mean": 2970.4,
"valid_targets_min": 1874
},
{
"epoch": 4.770999115826702,
"grad_norm": 0.7194697076051723,
"learning_rate": 1.116048369572674e-05,
"loss": 0.4034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21982774138450623,
"step": 2700,
"valid_targets_mean": 3383.4,
"valid_targets_min": 1312
},
{
"epoch": 4.779840848806366,
"grad_norm": 0.6669494326491152,
"learning_rate": 1.1081520856456267e-05,
"loss": 0.409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23762443661689758,
"step": 2705,
"valid_targets_mean": 3892.1,
"valid_targets_min": 412
},
{
"epoch": 4.78868258178603,
"grad_norm": 0.7108382848669145,
"learning_rate": 1.1002731162516453e-05,
"loss": 0.4359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1936943084001541,
"step": 2710,
"valid_targets_mean": 2535.1,
"valid_targets_min": 1712
},
{
"epoch": 4.797524314765694,
"grad_norm": 0.6713475501297167,
"learning_rate": 1.0924116143547878e-05,
"loss": 0.4171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21732935309410095,
"step": 2715,
"valid_targets_mean": 3802.6,
"valid_targets_min": 1567
},
{
"epoch": 4.8063660477453585,
"grad_norm": 0.7413050176699072,
"learning_rate": 1.0845677325799935e-05,
"loss": 0.4312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25657641887664795,
"step": 2720,
"valid_targets_mean": 3387.0,
"valid_targets_min": 385
},
{
"epoch": 4.815207780725022,
"grad_norm": 0.7577009577762279,
"learning_rate": 1.0767416232101215e-05,
"loss": 0.4391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28581398725509644,
"step": 2725,
"valid_targets_mean": 3098.0,
"valid_targets_min": 1745
},
{
"epoch": 4.824049513704686,
"grad_norm": 0.7724716975951001,
"learning_rate": 1.0689334381829948e-05,
"loss": 0.4088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20168830454349518,
"step": 2730,
"valid_targets_mean": 2979.0,
"valid_targets_min": 666
},
{
"epoch": 4.83289124668435,
"grad_norm": 0.7089679302709749,
"learning_rate": 1.0611433290884472e-05,
"loss": 0.4004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11011864989995956,
"step": 2735,
"valid_targets_mean": 2865.8,
"valid_targets_min": 492
},
{
"epoch": 4.841732979664014,
"grad_norm": 0.8144495361272787,
"learning_rate": 1.0533714471653832e-05,
"loss": 0.4312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19665873050689697,
"step": 2740,
"valid_targets_mean": 2790.5,
"valid_targets_min": 368
},
{
"epoch": 4.850574712643678,
"grad_norm": 0.77684643133323,
"learning_rate": 1.04561794329884e-05,
"loss": 0.4497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21007674932479858,
"step": 2745,
"valid_targets_mean": 2555.6,
"valid_targets_min": 1571
},
{
"epoch": 4.859416445623342,
"grad_norm": 0.742546614835338,
"learning_rate": 1.0378829680170622e-05,
"loss": 0.4322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3378821611404419,
"step": 2750,
"valid_targets_mean": 4008.6,
"valid_targets_min": 1946
},
{
"epoch": 4.868258178603006,
"grad_norm": 0.7479115324842988,
"learning_rate": 1.0301666714885725e-05,
"loss": 0.4325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2188922017812729,
"step": 2755,
"valid_targets_mean": 3129.8,
"valid_targets_min": 1540
},
{
"epoch": 4.87709991158267,
"grad_norm": 0.7454709519506926,
"learning_rate": 1.0224692035192625e-05,
"loss": 0.4438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28481394052505493,
"step": 2760,
"valid_targets_mean": 3897.9,
"valid_targets_min": 1390
},
{
"epoch": 4.885941644562334,
"grad_norm": 0.769621578421721,
"learning_rate": 1.0147907135494803e-05,
"loss": 0.4236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15574485063552856,
"step": 2765,
"valid_targets_mean": 2061.8,
"valid_targets_min": 933
},
{
"epoch": 4.894783377541998,
"grad_norm": 0.7396299843802391,
"learning_rate": 1.0071313506511334e-05,
"loss": 0.3959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16915792226791382,
"step": 2770,
"valid_targets_mean": 2474.2,
"valid_targets_min": 598
},
{
"epoch": 4.903625110521662,
"grad_norm": 0.6989394194624301,
"learning_rate": 9.9949126352479e-06,
"loss": 0.3991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22265878319740295,
"step": 2775,
"valid_targets_mean": 3984.8,
"valid_targets_min": 1638
},
{
"epoch": 4.912466843501326,
"grad_norm": 0.6502932314793353,
"learning_rate": 9.918706004967948e-06,
"loss": 0.4288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32565969228744507,
"step": 2780,
"valid_targets_mean": 4374.5,
"valid_targets_min": 1492
},
{
"epoch": 4.921308576480991,
"grad_norm": 0.7229307437239456,
"learning_rate": 9.842695095163878e-06,
"loss": 0.423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24379673600196838,
"step": 2785,
"valid_targets_mean": 3383.4,
"valid_targets_min": 974
},
{
"epoch": 4.930150309460654,
"grad_norm": 0.7940649246854591,
"learning_rate": 9.766881381528357e-06,
"loss": 0.4199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25852537155151367,
"step": 2790,
"valid_targets_mean": 3000.1,
"valid_targets_min": 760
},
{
"epoch": 4.938992042440319,
"grad_norm": 0.6722076902519407,
"learning_rate": 9.691266335925615e-06,
"loss": 0.4507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1473044753074646,
"step": 2795,
"valid_targets_mean": 2647.0,
"valid_targets_min": 648
},
{
"epoch": 4.947833775419983,
"grad_norm": 0.819920472445427,
"learning_rate": 9.615851426362904e-06,
"loss": 0.4385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1795499622821808,
"step": 2800,
"valid_targets_mean": 2951.1,
"valid_targets_min": 1215
},
{
"epoch": 4.9566755083996465,
"grad_norm": 0.7025906740887181,
"learning_rate": 9.540638116961986e-06,
"loss": 0.4195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25529012084007263,
"step": 2805,
"valid_targets_mean": 3555.2,
"valid_targets_min": 1071
},
{
"epoch": 4.9655172413793105,
"grad_norm": 0.7370327390638789,
"learning_rate": 9.465627867930734e-06,
"loss": 0.4017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20865119993686676,
"step": 2810,
"valid_targets_mean": 2461.0,
"valid_targets_min": 257
},
{
"epoch": 4.9743589743589745,
"grad_norm": 0.6324581481449822,
"learning_rate": 9.390822135534738e-06,
"loss": 0.4037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20276159048080444,
"step": 2815,
"valid_targets_mean": 3668.0,
"valid_targets_min": 1824
},
{
"epoch": 4.983200707338638,
"grad_norm": 0.7834993482168726,
"learning_rate": 9.31622237206907e-06,
"loss": 0.4356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17606160044670105,
"step": 2820,
"valid_targets_mean": 2788.4,
"valid_targets_min": 456
},
{
"epoch": 4.992042440318302,
"grad_norm": 0.6837420383955042,
"learning_rate": 9.241830025830059e-06,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18292655050754547,
"step": 2825,
"valid_targets_mean": 3192.5,
"valid_targets_min": 743
},
{
"epoch": 5.0,
"grad_norm": 1.1516433834283342,
"learning_rate": 9.167646541087216e-06,
"loss": 0.4185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4343792200088501,
"step": 2830,
"valid_targets_mean": 2228.5,
"valid_targets_min": 488
},
{
"epoch": 5.008841732979664,
"grad_norm": 0.7806271076048815,
"learning_rate": 9.09367335805515e-06,
"loss": 0.418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21847274899482727,
"step": 2835,
"valid_targets_mean": 3220.6,
"valid_targets_min": 649
},
{
"epoch": 5.017683465959328,
"grad_norm": 0.6706581564830443,
"learning_rate": 9.019911912865634e-06,
"loss": 0.3993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25733518600463867,
"step": 2840,
"valid_targets_mean": 3993.9,
"valid_targets_min": 1384
},
{
"epoch": 5.026525198938992,
"grad_norm": 0.728929240628752,
"learning_rate": 8.946363637539699e-06,
"loss": 0.3912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16333594918251038,
"step": 2845,
"valid_targets_mean": 2894.0,
"valid_targets_min": 487
},
{
"epoch": 5.035366931918656,
"grad_norm": 0.728458524357944,
"learning_rate": 8.87302995995988e-06,
"loss": 0.387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20494450628757477,
"step": 2850,
"valid_targets_mean": 3790.2,
"valid_targets_min": 1159
},
{
"epoch": 5.04420866489832,
"grad_norm": 0.7084662868772482,
"learning_rate": 8.799912303842437e-06,
"loss": 0.4087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20348328351974487,
"step": 2855,
"valid_targets_mean": 3220.6,
"valid_targets_min": 406
},
{
"epoch": 5.053050397877984,
"grad_norm": 0.7088150993211034,
"learning_rate": 8.727012088709751e-06,
"loss": 0.3722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22844524681568146,
"step": 2860,
"valid_targets_mean": 4072.2,
"valid_targets_min": 1095
},
{
"epoch": 5.061892130857648,
"grad_norm": 0.8455946822457715,
"learning_rate": 8.654330729862752e-06,
"loss": 0.3869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19593322277069092,
"step": 2865,
"valid_targets_mean": 2430.2,
"valid_targets_min": 432
},
{
"epoch": 5.0707338638373125,
"grad_norm": 0.5858642767010211,
"learning_rate": 8.58186963835346e-06,
"loss": 0.3783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21078699827194214,
"step": 2870,
"valid_targets_mean": 4977.0,
"valid_targets_min": 1444
},
{
"epoch": 5.0795755968169765,
"grad_norm": 0.7994534314183666,
"learning_rate": 8.509630220957554e-06,
"loss": 0.4093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19775576889514923,
"step": 2875,
"valid_targets_mean": 2545.8,
"valid_targets_min": 573
},
{
"epoch": 5.08841732979664,
"grad_norm": 0.8314569923246584,
"learning_rate": 8.437613880147093e-06,
"loss": 0.3913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1837921142578125,
"step": 2880,
"valid_targets_mean": 2678.4,
"valid_targets_min": 459
},
{
"epoch": 5.097259062776304,
"grad_norm": 0.7860099404554846,
"learning_rate": 8.365822014063287e-06,
"loss": 0.3658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17934468388557434,
"step": 2885,
"valid_targets_mean": 3174.5,
"valid_targets_min": 512
},
{
"epoch": 5.106100795755968,
"grad_norm": 0.7604145315647566,
"learning_rate": 8.29425601648933e-06,
"loss": 0.3952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21388058364391327,
"step": 2890,
"valid_targets_mean": 2896.4,
"valid_targets_min": 353
},
{
"epoch": 5.114942528735632,
"grad_norm": 0.8107815627893672,
"learning_rate": 8.222917276823361e-06,
"loss": 0.3976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22443638741970062,
"step": 2895,
"valid_targets_mean": 3731.9,
"valid_targets_min": 1274
},
{
"epoch": 5.123784261715296,
"grad_norm": 0.7079702745049611,
"learning_rate": 8.151807180051474e-06,
"loss": 0.4313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25032246112823486,
"step": 2900,
"valid_targets_mean": 3908.5,
"valid_targets_min": 386
},
{
"epoch": 5.13262599469496,
"grad_norm": 0.7899459874887411,
"learning_rate": 8.080927106720862e-06,
"loss": 0.4158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1818743646144867,
"step": 2905,
"valid_targets_mean": 2431.4,
"valid_targets_min": 258
},
{
"epoch": 5.141467727674624,
"grad_norm": 0.8962540094006461,
"learning_rate": 8.010278432912971e-06,
"loss": 0.4258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31215745210647583,
"step": 2910,
"valid_targets_mean": 3037.2,
"valid_targets_min": 1060
},
{
"epoch": 5.150309460654288,
"grad_norm": 0.7521497447867146,
"learning_rate": 7.939862530216808e-06,
"loss": 0.3872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18189725279808044,
"step": 2915,
"valid_targets_mean": 2674.8,
"valid_targets_min": 979
},
{
"epoch": 5.159151193633952,
"grad_norm": 0.7250094122688368,
"learning_rate": 7.869680765702313e-06,
"loss": 0.4319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1579514592885971,
"step": 2920,
"valid_targets_mean": 2929.2,
"valid_targets_min": 1224
},
{
"epoch": 5.167992926613616,
"grad_norm": 0.7675162922726106,
"learning_rate": 7.799734501893825e-06,
"loss": 0.3872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1362682580947876,
"step": 2925,
"valid_targets_mean": 2386.4,
"valid_targets_min": 618
},
{
"epoch": 5.17683465959328,
"grad_norm": 0.6709418238351449,
"learning_rate": 7.730025096743601e-06,
"loss": 0.4124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16993936896324158,
"step": 2930,
"valid_targets_mean": 3081.4,
"valid_targets_min": 358
},
{
"epoch": 5.185676392572944,
"grad_norm": 0.6432114501479861,
"learning_rate": 7.6605539036055e-06,
"loss": 0.3949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1883753538131714,
"step": 2935,
"valid_targets_mean": 4789.6,
"valid_targets_min": 321
},
{
"epoch": 5.194518125552609,
"grad_norm": 0.7001052560650384,
"learning_rate": 7.591322271208639e-06,
"loss": 0.3833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1550978720188141,
"step": 2940,
"valid_targets_mean": 2667.6,
"valid_targets_min": 1459
},
{
"epoch": 5.203359858532273,
"grad_norm": 1.0203017538563217,
"learning_rate": 7.522331543631289e-06,
"loss": 0.3966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27559781074523926,
"step": 2945,
"valid_targets_mean": 2583.2,
"valid_targets_min": 558
},
{
"epoch": 5.212201591511937,
"grad_norm": 0.63220733334086,
"learning_rate": 7.453583060274714e-06,
"loss": 0.3912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1653447449207306,
"step": 2950,
"valid_targets_mean": 4349.5,
"valid_targets_min": 2007
},
{
"epoch": 5.221043324491601,
"grad_norm": 0.7658723022429813,
"learning_rate": 7.385078155837226e-06,
"loss": 0.4172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2508220672607422,
"step": 2955,
"valid_targets_mean": 3356.6,
"valid_targets_min": 1549
},
{
"epoch": 5.2298850574712645,
"grad_norm": 0.6379179057891206,
"learning_rate": 7.316818160288195e-06,
"loss": 0.3916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2654326558113098,
"step": 2960,
"valid_targets_mean": 4930.0,
"valid_targets_min": 447
},
{
"epoch": 5.2387267904509285,
"grad_norm": 0.8198169061308748,
"learning_rate": 7.248804398842322e-06,
"loss": 0.4376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17658288776874542,
"step": 2965,
"valid_targets_mean": 2807.2,
"valid_targets_min": 1191
},
{
"epoch": 5.247568523430592,
"grad_norm": 0.7161368425685732,
"learning_rate": 7.181038191933833e-06,
"loss": 0.3725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23815590143203735,
"step": 2970,
"valid_targets_mean": 3746.0,
"valid_targets_min": 347
},
{
"epoch": 5.256410256410256,
"grad_norm": 0.7383520605352984,
"learning_rate": 7.113520855190907e-06,
"loss": 0.3862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17981159687042236,
"step": 2975,
"valid_targets_mean": 2893.6,
"valid_targets_min": 1261
},
{
"epoch": 5.26525198938992,
"grad_norm": 0.7617118383380348,
"learning_rate": 7.046253699410058e-06,
"loss": 0.3901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24191364645957947,
"step": 2980,
"valid_targets_mean": 3604.0,
"valid_targets_min": 298
},
{
"epoch": 5.274093722369584,
"grad_norm": 0.761360266153581,
"learning_rate": 6.979238030530775e-06,
"loss": 0.3823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29760921001434326,
"step": 2985,
"valid_targets_mean": 5094.0,
"valid_targets_min": 830
},
{
"epoch": 5.282935455349248,
"grad_norm": 0.6957464522130561,
"learning_rate": 6.912475149610094e-06,
"loss": 0.375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14544111490249634,
"step": 2990,
"valid_targets_mean": 2849.9,
"valid_targets_min": 1018
},
{
"epoch": 5.291777188328912,
"grad_norm": 0.8834015419681706,
"learning_rate": 6.8459663527973995e-06,
"loss": 0.4253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2348986715078354,
"step": 2995,
"valid_targets_mean": 2487.2,
"valid_targets_min": 360
},
{
"epoch": 5.300618921308576,
"grad_norm": 0.7175307826338068,
"learning_rate": 6.779712931309186e-06,
"loss": 0.4069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13426730036735535,
"step": 3000,
"valid_targets_mean": 2886.1,
"valid_targets_min": 1293
},
{
"epoch": 5.30946065428824,
"grad_norm": 0.6263326470511927,
"learning_rate": 6.713716171404086e-06,
"loss": 0.4349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2130982130765915,
"step": 3005,
"valid_targets_mean": 4677.0,
"valid_targets_min": 1091
},
{
"epoch": 5.318302387267904,
"grad_norm": 0.7281926036143173,
"learning_rate": 6.647977354357804e-06,
"loss": 0.4308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22627121210098267,
"step": 3010,
"valid_targets_mean": 2928.8,
"valid_targets_min": 460
},
{
"epoch": 5.327144120247569,
"grad_norm": 0.6832070210761304,
"learning_rate": 6.582497756438326e-06,
"loss": 0.386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27786123752593994,
"step": 3015,
"valid_targets_mean": 4205.2,
"valid_targets_min": 1913
},
{
"epoch": 5.335985853227233,
"grad_norm": 0.7067931683994918,
"learning_rate": 6.517278648881054e-06,
"loss": 0.3716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2012796401977539,
"step": 3020,
"valid_targets_mean": 3926.8,
"valid_targets_min": 1419
},
{
"epoch": 5.344827586206897,
"grad_norm": 1.0101144556395403,
"learning_rate": 6.452321297864212e-06,
"loss": 0.4082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1759074628353119,
"step": 3025,
"valid_targets_mean": 1739.6,
"valid_targets_min": 565
},
{
"epoch": 5.353669319186561,
"grad_norm": 0.6504695714072357,
"learning_rate": 6.387626964484197e-06,
"loss": 0.3963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1815790832042694,
"step": 3030,
"valid_targets_mean": 3034.5,
"valid_targets_min": 260
},
{
"epoch": 5.362511052166225,
"grad_norm": 0.829852685254614,
"learning_rate": 6.323196904731155e-06,
"loss": 0.3854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1513374149799347,
"step": 3035,
"valid_targets_mean": 2116.5,
"valid_targets_min": 769
},
{
"epoch": 5.371352785145889,
"grad_norm": 0.7446352358190379,
"learning_rate": 6.259032369464522e-06,
"loss": 0.3956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27236083149909973,
"step": 3040,
"valid_targets_mean": 3079.9,
"valid_targets_min": 366
},
{
"epoch": 5.380194518125553,
"grad_norm": 0.8228515281616915,
"learning_rate": 6.195134604388819e-06,
"loss": 0.4388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3066047430038452,
"step": 3045,
"valid_targets_mean": 3165.6,
"valid_targets_min": 1862
},
{
"epoch": 5.389036251105217,
"grad_norm": 0.7798826897148097,
"learning_rate": 6.1315048500294125e-06,
"loss": 0.4576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19620686769485474,
"step": 3050,
"valid_targets_mean": 3101.9,
"valid_targets_min": 515
},
{
"epoch": 5.3978779840848805,
"grad_norm": 0.930463249760995,
"learning_rate": 6.068144341708464e-06,
"loss": 0.4117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18991626799106598,
"step": 3055,
"valid_targets_mean": 2486.2,
"valid_targets_min": 287
},
{
"epoch": 5.4067197170645445,
"grad_norm": 0.7704365886141176,
"learning_rate": 6.0050543095209215e-06,
"loss": 0.402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1924263834953308,
"step": 3060,
"valid_targets_mean": 3358.0,
"valid_targets_min": 1254
},
{
"epoch": 5.415561450044208,
"grad_norm": 0.8532428692792394,
"learning_rate": 5.942235978310649e-06,
"loss": 0.4086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22423534095287323,
"step": 3065,
"valid_targets_mean": 3000.2,
"valid_targets_min": 1198
},
{
"epoch": 5.424403183023872,
"grad_norm": 0.669085550320398,
"learning_rate": 5.879690567646645e-06,
"loss": 0.4072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1893330216407776,
"step": 3070,
"valid_targets_mean": 3361.8,
"valid_targets_min": 1890
},
{
"epoch": 5.433244916003536,
"grad_norm": 0.7376176849413955,
"learning_rate": 5.817419291799388e-06,
"loss": 0.4171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16862516105175018,
"step": 3075,
"valid_targets_mean": 3250.4,
"valid_targets_min": 1327
},
{
"epoch": 5.442086648983201,
"grad_norm": 0.6542529886450859,
"learning_rate": 5.755423359717222e-06,
"loss": 0.3953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13393324613571167,
"step": 3080,
"valid_targets_mean": 2877.9,
"valid_targets_min": 559
},
{
"epoch": 5.450928381962865,
"grad_norm": 0.6392677271638753,
"learning_rate": 5.693703975002911e-06,
"loss": 0.4028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13595180213451385,
"step": 3085,
"valid_targets_mean": 2198.1,
"valid_targets_min": 1258
},
{
"epoch": 5.459770114942529,
"grad_norm": 0.8729225649131562,
"learning_rate": 5.632262335890262e-06,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21021749079227448,
"step": 3090,
"valid_targets_mean": 2377.5,
"valid_targets_min": 526
},
{
"epoch": 5.468611847922193,
"grad_norm": 0.6919169604156997,
"learning_rate": 5.571099635220887e-06,
"loss": 0.3906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09621213376522064,
"step": 3095,
"valid_targets_mean": 1912.2,
"valid_targets_min": 309
},
{
"epoch": 5.477453580901857,
"grad_norm": 0.9121306344310365,
"learning_rate": 5.510217060421006e-06,
"loss": 0.3922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.281181275844574,
"step": 3100,
"valid_targets_mean": 2873.5,
"valid_targets_min": 1299
},
{
"epoch": 5.486295313881521,
"grad_norm": 0.7192489768020969,
"learning_rate": 5.449615793478411e-06,
"loss": 0.4078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16287308931350708,
"step": 3105,
"valid_targets_mean": 3211.4,
"valid_targets_min": 961
},
{
"epoch": 5.495137046861185,
"grad_norm": 0.831717545619796,
"learning_rate": 5.389297010919545e-06,
"loss": 0.4097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19926907122135162,
"step": 3110,
"valid_targets_mean": 2817.5,
"valid_targets_min": 1149
},
{
"epoch": 5.503978779840849,
"grad_norm": 0.8140212742785664,
"learning_rate": 5.329261883786611e-06,
"loss": 0.4226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15885740518569946,
"step": 3115,
"valid_targets_mean": 2335.2,
"valid_targets_min": 514
},
{
"epoch": 5.512820512820513,
"grad_norm": 0.9603182918185311,
"learning_rate": 5.2695115776148765e-06,
"loss": 0.3965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2298716902732849,
"step": 3120,
"valid_targets_mean": 1846.4,
"valid_targets_min": 431
},
{
"epoch": 5.521662245800177,
"grad_norm": 0.8019735181021684,
"learning_rate": 5.21004725241002e-06,
"loss": 0.3822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22657175362110138,
"step": 3125,
"valid_targets_mean": 2703.9,
"valid_targets_min": 1080
},
{
"epoch": 5.530503978779841,
"grad_norm": 0.6986863564233587,
"learning_rate": 5.150870062625639e-06,
"loss": 0.3983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12742537260055542,
"step": 3130,
"valid_targets_mean": 2276.5,
"valid_targets_min": 391
},
{
"epoch": 5.539345711759505,
"grad_norm": 0.6392753287000917,
"learning_rate": 5.091981157140808e-06,
"loss": 0.4035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16173365712165833,
"step": 3135,
"valid_targets_mean": 3372.1,
"valid_targets_min": 567
},
{
"epoch": 5.548187444739169,
"grad_norm": 0.6393994411262591,
"learning_rate": 5.03338167923779e-06,
"loss": 0.3976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24456486105918884,
"step": 3140,
"valid_targets_mean": 4942.8,
"valid_targets_min": 1585
},
{
"epoch": 5.5570291777188325,
"grad_norm": 0.6957281925877212,
"learning_rate": 4.975072766579829e-06,
"loss": 0.4048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13130195438861847,
"step": 3145,
"valid_targets_mean": 2417.5,
"valid_targets_min": 344
},
{
"epoch": 5.5658709106984965,
"grad_norm": 0.9301033896027021,
"learning_rate": 4.917055551189089e-06,
"loss": 0.3766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24469897150993347,
"step": 3150,
"valid_targets_mean": 2273.6,
"valid_targets_min": 1133
},
{
"epoch": 5.574712643678161,
"grad_norm": 0.6781134728348155,
"learning_rate": 4.859331159424645e-06,
"loss": 0.3818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16952422261238098,
"step": 3155,
"valid_targets_mean": 3207.5,
"valid_targets_min": 298
},
{
"epoch": 5.583554376657825,
"grad_norm": 0.6976758942726916,
"learning_rate": 4.801900711960628e-06,
"loss": 0.3838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16358278691768646,
"step": 3160,
"valid_targets_mean": 3211.9,
"valid_targets_min": 1839
},
{
"epoch": 5.592396109637489,
"grad_norm": 0.7660887912670873,
"learning_rate": 4.744765323764469e-06,
"loss": 0.4141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2197507917881012,
"step": 3165,
"valid_targets_mean": 2894.8,
"valid_targets_min": 1342
},
{
"epoch": 5.601237842617153,
"grad_norm": 0.7314275252775809,
"learning_rate": 4.6879261040752685e-06,
"loss": 0.3959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14985954761505127,
"step": 3170,
"valid_targets_mean": 2667.5,
"valid_targets_min": 465
},
{
"epoch": 5.610079575596817,
"grad_norm": 0.6999874428567335,
"learning_rate": 4.63138415638223e-06,
"loss": 0.4117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18852269649505615,
"step": 3175,
"valid_targets_mean": 3877.0,
"valid_targets_min": 667
},
{
"epoch": 5.618921308576481,
"grad_norm": 0.7215106059187592,
"learning_rate": 4.575140578403256e-06,
"loss": 0.4084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15598289668560028,
"step": 3180,
"valid_targets_mean": 2837.5,
"valid_targets_min": 247
},
{
"epoch": 5.627763041556145,
"grad_norm": 0.6810403634872003,
"learning_rate": 4.519196462063628e-06,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24649617075920105,
"step": 3185,
"valid_targets_mean": 4866.0,
"valid_targets_min": 503
},
{
"epoch": 5.636604774535809,
"grad_norm": 0.8661083461110505,
"learning_rate": 4.4635528934748315e-06,
"loss": 0.4099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25795987248420715,
"step": 3190,
"valid_targets_mean": 2327.2,
"valid_targets_min": 327
},
{
"epoch": 5.645446507515473,
"grad_norm": 0.9984452335642174,
"learning_rate": 4.408210952913434e-06,
"loss": 0.4076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21475867927074432,
"step": 3195,
"valid_targets_mean": 2365.8,
"valid_targets_min": 523
},
{
"epoch": 5.654288240495137,
"grad_norm": 0.63284420296626,
"learning_rate": 4.353171714800135e-06,
"loss": 0.3617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21914245188236237,
"step": 3200,
"valid_targets_mean": 4543.1,
"valid_targets_min": 1153
},
{
"epoch": 5.663129973474801,
"grad_norm": 0.7215660888800569,
"learning_rate": 4.298436247678892e-06,
"loss": 0.4097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18757544457912445,
"step": 3205,
"valid_targets_mean": 3180.9,
"valid_targets_min": 260
},
{
"epoch": 5.671971706454465,
"grad_norm": 0.8776106727330101,
"learning_rate": 4.2440056141962116e-06,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23493947088718414,
"step": 3210,
"valid_targets_mean": 2881.6,
"valid_targets_min": 329
},
{
"epoch": 5.680813439434129,
"grad_norm": 0.8049825392272455,
"learning_rate": 4.189880871080465e-06,
"loss": 0.4049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13369911909103394,
"step": 3215,
"valid_targets_mean": 3066.9,
"valid_targets_min": 371
},
{
"epoch": 5.689655172413794,
"grad_norm": 0.8302974347090468,
"learning_rate": 4.136063069121412e-06,
"loss": 0.3795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1873476505279541,
"step": 3220,
"valid_targets_mean": 2237.5,
"valid_targets_min": 687
},
{
"epoch": 5.698496905393457,
"grad_norm": 0.6993234633000938,
"learning_rate": 4.082553253149784e-06,
"loss": 0.3919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21738377213478088,
"step": 3225,
"valid_targets_mean": 3679.9,
"valid_targets_min": 1340
},
{
"epoch": 5.7073386383731215,
"grad_norm": 0.9105087640110349,
"learning_rate": 4.029352462017016e-06,
"loss": 0.4019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23904664814472198,
"step": 3230,
"valid_targets_mean": 2628.5,
"valid_targets_min": 778
},
{
"epoch": 5.7161803713527854,
"grad_norm": 0.7887831667909359,
"learning_rate": 3.9764617285750516e-06,
"loss": 0.3985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15723231434822083,
"step": 3235,
"valid_targets_mean": 2306.4,
"valid_targets_min": 505
},
{
"epoch": 5.725022104332449,
"grad_norm": 0.8628976638475314,
"learning_rate": 3.923882079656311e-06,
"loss": 0.3979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1998981535434723,
"step": 3240,
"valid_targets_mean": 2389.6,
"valid_targets_min": 368
},
{
"epoch": 5.733863837312113,
"grad_norm": 0.8851868206445387,
"learning_rate": 3.8716145360537516e-06,
"loss": 0.3869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23257210850715637,
"step": 3245,
"valid_targets_mean": 2343.6,
"valid_targets_min": 480
},
{
"epoch": 5.742705570291777,
"grad_norm": 0.7909943609866004,
"learning_rate": 3.819660112501053e-06,
"loss": 0.4063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.237594872713089,
"step": 3250,
"valid_targets_mean": 3360.4,
"valid_targets_min": 1582
},
{
"epoch": 5.751547303271441,
"grad_norm": 0.9465551894292238,
"learning_rate": 3.768019817652906e-06,
"loss": 0.4158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17449277639389038,
"step": 3255,
"valid_targets_mean": 1845.4,
"valid_targets_min": 668
},
{
"epoch": 5.760389036251105,
"grad_norm": 0.8378732351349432,
"learning_rate": 3.7166946540654403e-06,
"loss": 0.3863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22095929086208344,
"step": 3260,
"valid_targets_mean": 2153.5,
"valid_targets_min": 459
},
{
"epoch": 5.769230769230769,
"grad_norm": 0.7193963936499834,
"learning_rate": 3.6656856181767487e-06,
"loss": 0.427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17883676290512085,
"step": 3265,
"valid_targets_mean": 3431.5,
"valid_targets_min": 778
},
{
"epoch": 5.778072502210433,
"grad_norm": 0.8619394466221819,
"learning_rate": 3.6149937002875725e-06,
"loss": 0.4139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1710013896226883,
"step": 3270,
"valid_targets_mean": 1953.4,
"valid_targets_min": 296
},
{
"epoch": 5.786914235190097,
"grad_norm": 0.7617624941176476,
"learning_rate": 3.564619884542033e-06,
"loss": 0.4073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18097054958343506,
"step": 3275,
"valid_targets_mean": 2563.1,
"valid_targets_min": 1498
},
{
"epoch": 5.795755968169761,
"grad_norm": 0.7210899911422212,
"learning_rate": 3.514565148908553e-06,
"loss": 0.4115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21109169721603394,
"step": 3280,
"valid_targets_mean": 3776.4,
"valid_targets_min": 1323
},
{
"epoch": 5.804597701149425,
"grad_norm": 0.8741955579576905,
"learning_rate": 3.4648304651608623e-06,
"loss": 0.3956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17497266829013824,
"step": 3285,
"valid_targets_mean": 2469.2,
"valid_targets_min": 1320
},
{
"epoch": 5.813439434129089,
"grad_norm": 0.7414269383554729,
"learning_rate": 3.4154167988591367e-06,
"loss": 0.3837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15306875109672546,
"step": 3290,
"valid_targets_mean": 2028.0,
"valid_targets_min": 559
},
{
"epoch": 5.822281167108754,
"grad_norm": 0.680343087267019,
"learning_rate": 3.3663251093312477e-06,
"loss": 0.4257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15991319715976715,
"step": 3295,
"valid_targets_mean": 3004.1,
"valid_targets_min": 1060
},
{
"epoch": 5.831122900088418,
"grad_norm": 0.7192829761203814,
"learning_rate": 3.317556349654125e-06,
"loss": 0.3822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24054303765296936,
"step": 3300,
"valid_targets_mean": 4578.8,
"valid_targets_min": 867
},
{
"epoch": 5.839964633068082,
"grad_norm": 0.8129183520607333,
"learning_rate": 3.2691114666352887e-06,
"loss": 0.41,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17372924089431763,
"step": 3305,
"valid_targets_mean": 1957.9,
"valid_targets_min": 308
},
{
"epoch": 5.848806366047746,
"grad_norm": 0.6912822577892667,
"learning_rate": 3.220991400794431e-06,
"loss": 0.3794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20085839927196503,
"step": 3310,
"valid_targets_mean": 4113.1,
"valid_targets_min": 478
},
{
"epoch": 5.85764809902741,
"grad_norm": 0.7568673476778853,
"learning_rate": 3.1731970863451746e-06,
"loss": 0.3949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16372664272785187,
"step": 3315,
"valid_targets_mean": 2882.0,
"valid_targets_min": 350
},
{
"epoch": 5.8664898320070735,
"grad_norm": 0.8292901753145713,
"learning_rate": 3.1257294511769263e-06,
"loss": 0.3945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1919775903224945,
"step": 3320,
"valid_targets_mean": 2993.4,
"valid_targets_min": 409
},
{
"epoch": 5.8753315649867375,
"grad_norm": 0.66874118757708,
"learning_rate": 3.0785894168368857e-06,
"loss": 0.4101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3156202435493469,
"step": 3325,
"valid_targets_mean": 4430.4,
"valid_targets_min": 1275
},
{
"epoch": 5.884173297966401,
"grad_norm": 0.7803502732071088,
"learning_rate": 3.0317778985121182e-06,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17863729596138,
"step": 3330,
"valid_targets_mean": 2628.6,
"valid_targets_min": 262
},
{
"epoch": 5.893015030946065,
"grad_norm": 0.8120192943631549,
"learning_rate": 2.9852958050118275e-06,
"loss": 0.4182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1689552515745163,
"step": 3335,
"valid_targets_mean": 3196.8,
"valid_targets_min": 318
},
{
"epoch": 5.901856763925729,
"grad_norm": 0.7503397178701974,
"learning_rate": 2.9391440387496617e-06,
"loss": 0.4242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1889551877975464,
"step": 3340,
"valid_targets_mean": 3213.4,
"valid_targets_min": 363
},
{
"epoch": 5.910698496905393,
"grad_norm": 0.8591198480547091,
"learning_rate": 2.89332349572625e-06,
"loss": 0.3703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1662624180316925,
"step": 3345,
"valid_targets_mean": 1885.9,
"valid_targets_min": 543
},
{
"epoch": 5.919540229885057,
"grad_norm": 0.9519020720938417,
"learning_rate": 2.847835065511766e-06,
"loss": 0.3988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17353492975234985,
"step": 3350,
"valid_targets_mean": 1727.4,
"valid_targets_min": 349
},
{
"epoch": 5.928381962864721,
"grad_norm": 0.8747102894127499,
"learning_rate": 2.8026796312286843e-06,
"loss": 0.4373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23620933294296265,
"step": 3355,
"valid_targets_mean": 3666.1,
"valid_targets_min": 1644
},
{
"epoch": 5.937223695844385,
"grad_norm": 0.6376827702661823,
"learning_rate": 2.757858069534598e-06,
"loss": 0.3984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1924460232257843,
"step": 3360,
"valid_targets_mean": 4527.5,
"valid_targets_min": 553
},
{
"epoch": 5.946065428824049,
"grad_norm": 0.6516051452822853,
"learning_rate": 2.71337125060525e-06,
"loss": 0.417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3005494475364685,
"step": 3365,
"valid_targets_mean": 5757.8,
"valid_targets_min": 2223
},
{
"epoch": 5.954907161803714,
"grad_norm": 0.732478020417441,
"learning_rate": 2.669220038117597e-06,
"loss": 0.4419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27111363410949707,
"step": 3370,
"valid_targets_mean": 3390.0,
"valid_targets_min": 458
},
{
"epoch": 5.963748894783378,
"grad_norm": 0.8080636185217684,
"learning_rate": 2.6254052892330737e-06,
"loss": 0.4438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3034144341945648,
"step": 3375,
"valid_targets_mean": 3722.1,
"valid_targets_min": 517
},
{
"epoch": 5.972590627763042,
"grad_norm": 0.7169451114480241,
"learning_rate": 2.5819278545809103e-06,
"loss": 0.4149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27992749214172363,
"step": 3380,
"valid_targets_mean": 3570.2,
"valid_targets_min": 396
},
{
"epoch": 5.981432360742706,
"grad_norm": 0.844425388762182,
"learning_rate": 2.5387885782416712e-06,
"loss": 0.3631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17740076780319214,
"step": 3385,
"valid_targets_mean": 2162.0,
"valid_targets_min": 550
},
{
"epoch": 5.99027409372237,
"grad_norm": 0.6494113116563578,
"learning_rate": 2.495988297730818e-06,
"loss": 0.4035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20014826953411102,
"step": 3390,
"valid_targets_mean": 4345.4,
"valid_targets_min": 438
},
{
"epoch": 5.999115826702034,
"grad_norm": 0.6847608100268655,
"learning_rate": 2.453527843982497e-06,
"loss": 0.3689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28000521659851074,
"step": 3395,
"valid_targets_mean": 5669.8,
"valid_targets_min": 1543
},
{
"epoch": 6.007073386383731,
"grad_norm": 0.7892539431347021,
"learning_rate": 2.4114080413333474e-06,
"loss": 0.3823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21648083627223969,
"step": 3400,
"valid_targets_mean": 3293.4,
"valid_targets_min": 1170
},
{
"epoch": 6.015915119363395,
"grad_norm": 0.7327489748764502,
"learning_rate": 2.369629707506569e-06,
"loss": 0.3901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21525824069976807,
"step": 3405,
"valid_targets_mean": 2875.0,
"valid_targets_min": 1100
},
{
"epoch": 6.024756852343059,
"grad_norm": 0.7427914142271864,
"learning_rate": 2.328193653595985e-06,
"loss": 0.3892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29550355672836304,
"step": 3410,
"valid_targets_mean": 3901.6,
"valid_targets_min": 1147
},
{
"epoch": 6.033598585322723,
"grad_norm": 0.7551934122627986,
"learning_rate": 2.2871006840503384e-06,
"loss": 0.385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1656990498304367,
"step": 3415,
"valid_targets_mean": 2678.4,
"valid_targets_min": 911
},
{
"epoch": 6.042440318302387,
"grad_norm": 0.8014400239410849,
"learning_rate": 2.2463515966576342e-06,
"loss": 0.3856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19182810187339783,
"step": 3420,
"valid_targets_mean": 2418.2,
"valid_targets_min": 415
},
{
"epoch": 6.051282051282051,
"grad_norm": 0.897788988403115,
"learning_rate": 2.2059471825296973e-06,
"loss": 0.3931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26385846734046936,
"step": 3425,
"valid_targets_mean": 2770.5,
"valid_targets_min": 562
},
{
"epoch": 6.060123784261715,
"grad_norm": 0.8149264081278768,
"learning_rate": 2.1658882260867698e-06,
"loss": 0.3711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12121979147195816,
"step": 3430,
"valid_targets_mean": 1847.2,
"valid_targets_min": 1211
},
{
"epoch": 6.068965517241379,
"grad_norm": 0.9058022749241772,
"learning_rate": 2.1261755050423204e-06,
"loss": 0.3914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18681831657886505,
"step": 3435,
"valid_targets_mean": 2502.9,
"valid_targets_min": 294
},
{
"epoch": 6.077807250221043,
"grad_norm": 0.5875487670316494,
"learning_rate": 2.086809790387905e-06,
"loss": 0.3824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14535044133663177,
"step": 3440,
"valid_targets_mean": 3132.5,
"valid_targets_min": 673
},
{
"epoch": 6.086648983200707,
"grad_norm": 0.7952935546054049,
"learning_rate": 2.047791846378242e-06,
"loss": 0.3832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18173527717590332,
"step": 3445,
"valid_targets_mean": 3148.6,
"valid_targets_min": 482
},
{
"epoch": 6.095490716180372,
"grad_norm": 0.7607277089232913,
"learning_rate": 2.009122430516337e-06,
"loss": 0.3862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17606256902217865,
"step": 3450,
"valid_targets_mean": 2331.9,
"valid_targets_min": 1478
},
{
"epoch": 6.104332449160036,
"grad_norm": 0.7496258419853713,
"learning_rate": 1.970802293538807e-06,
"loss": 0.3777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27735546231269836,
"step": 3455,
"valid_targets_mean": 4273.4,
"valid_targets_min": 1153
},
{
"epoch": 6.1131741821397,
"grad_norm": 0.6985174849382113,
"learning_rate": 1.9328321794012762e-06,
"loss": 0.3882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2295549213886261,
"step": 3460,
"valid_targets_mean": 3212.6,
"valid_targets_min": 358
},
{
"epoch": 6.122015915119364,
"grad_norm": 0.6160591675123345,
"learning_rate": 1.895212825263959e-06,
"loss": 0.3912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.262872576713562,
"step": 3465,
"valid_targets_mean": 6619.6,
"valid_targets_min": 1010
},
{
"epoch": 6.130857648099028,
"grad_norm": 0.8207914026042112,
"learning_rate": 1.8579449614773314e-06,
"loss": 0.3729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13713327050209045,
"step": 3470,
"valid_targets_mean": 1882.8,
"valid_targets_min": 591
},
{
"epoch": 6.1396993810786915,
"grad_norm": 0.8071469248304369,
"learning_rate": 1.8210293115679677e-06,
"loss": 0.4061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2146981954574585,
"step": 3475,
"valid_targets_mean": 3234.0,
"valid_targets_min": 559
},
{
"epoch": 6.1485411140583555,
"grad_norm": 0.6897319556110078,
"learning_rate": 1.784466592224472e-06,
"loss": 0.3966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13424663245677948,
"step": 3480,
"valid_targets_mean": 2311.5,
"valid_targets_min": 676
},
{
"epoch": 6.157382847038019,
"grad_norm": 0.729819719486692,
"learning_rate": 1.74825751328358e-06,
"loss": 0.3926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19196979701519012,
"step": 3485,
"valid_targets_mean": 3340.2,
"valid_targets_min": 554
},
{
"epoch": 6.166224580017683,
"grad_norm": 0.8426168349719839,
"learning_rate": 1.7124027777163732e-06,
"loss": 0.4201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14435023069381714,
"step": 3490,
"valid_targets_mean": 1912.6,
"valid_targets_min": 319
},
{
"epoch": 6.175066312997347,
"grad_norm": 0.759757715201301,
"learning_rate": 1.6769030816146404e-06,
"loss": 0.3965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22856047749519348,
"step": 3495,
"valid_targets_mean": 3739.8,
"valid_targets_min": 924
},
{
"epoch": 6.183908045977011,
"grad_norm": 0.8366056994371286,
"learning_rate": 1.6417591141773458e-06,
"loss": 0.4146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17554280161857605,
"step": 3500,
"valid_targets_mean": 2551.6,
"valid_targets_min": 529
},
{
"epoch": 6.192749778956675,
"grad_norm": 0.7980312027283708,
"learning_rate": 1.6069715576972634e-06,
"loss": 0.3904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27862659096717834,
"step": 3505,
"valid_targets_mean": 3707.2,
"valid_targets_min": 1715
},
{
"epoch": 6.201591511936339,
"grad_norm": 0.7364325995709389,
"learning_rate": 1.5725410875477187e-06,
"loss": 0.3608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1674642115831375,
"step": 3510,
"valid_targets_mean": 2912.5,
"valid_targets_min": 263
},
{
"epoch": 6.210433244916003,
"grad_norm": 0.8858927969586514,
"learning_rate": 1.5384683721694993e-06,
"loss": 0.3889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18463276326656342,
"step": 3515,
"valid_targets_mean": 2316.4,
"valid_targets_min": 715
},
{
"epoch": 6.219274977895668,
"grad_norm": 0.8919860695858821,
"learning_rate": 1.504754073057846e-06,
"loss": 0.4015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19577711820602417,
"step": 3520,
"valid_targets_mean": 1823.4,
"valid_targets_min": 384
},
{
"epoch": 6.228116710875332,
"grad_norm": 0.8455766242568858,
"learning_rate": 1.4713988447496342e-06,
"loss": 0.4037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19854457676410675,
"step": 3525,
"valid_targets_mean": 2662.8,
"valid_targets_min": 608
},
{
"epoch": 6.236958443854996,
"grad_norm": 0.744453900421472,
"learning_rate": 1.438403334810663e-06,
"loss": 0.3768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15537121891975403,
"step": 3530,
"valid_targets_mean": 2982.4,
"valid_targets_min": 2031
},
{
"epoch": 6.24580017683466,
"grad_norm": 0.8827206937052091,
"learning_rate": 1.405768183823073e-06,
"loss": 0.3864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19907264411449432,
"step": 3535,
"valid_targets_mean": 2362.4,
"valid_targets_min": 452
},
{
"epoch": 6.254641909814324,
"grad_norm": 0.8416510383985708,
"learning_rate": 1.3734940253729167e-06,
"loss": 0.3777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22170794010162354,
"step": 3540,
"valid_targets_mean": 3408.8,
"valid_targets_min": 293
},
{
"epoch": 6.263483642793988,
"grad_norm": 0.7873873101117113,
"learning_rate": 1.3415814860378573e-06,
"loss": 0.3766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14214427769184113,
"step": 3545,
"valid_targets_mean": 2900.8,
"valid_targets_min": 394
},
{
"epoch": 6.272325375773652,
"grad_norm": 0.7347622266646417,
"learning_rate": 1.3100311853750114e-06,
"loss": 0.4088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.152814120054245,
"step": 3550,
"valid_targets_mean": 2783.9,
"valid_targets_min": 780
},
{
"epoch": 6.281167108753316,
"grad_norm": 0.8638119930741502,
"learning_rate": 1.2788437359089056e-06,
"loss": 0.3869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2797715365886688,
"step": 3555,
"valid_targets_mean": 3625.0,
"valid_targets_min": 1228
},
{
"epoch": 6.29000884173298,
"grad_norm": 0.7458458853206296,
"learning_rate": 1.248019743119595e-06,
"loss": 0.3677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2126968950033188,
"step": 3560,
"valid_targets_mean": 3209.9,
"valid_targets_min": 275
},
{
"epoch": 6.2988505747126435,
"grad_norm": 0.7013433868816651,
"learning_rate": 1.2175598054309058e-06,
"loss": 0.3637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24043208360671997,
"step": 3565,
"valid_targets_mean": 4891.2,
"valid_targets_min": 711
},
{
"epoch": 6.3076923076923075,
"grad_norm": 0.7155286710184046,
"learning_rate": 1.187464514198824e-06,
"loss": 0.389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22147774696350098,
"step": 3570,
"valid_targets_mean": 3511.0,
"valid_targets_min": 661
},
{
"epoch": 6.316534040671971,
"grad_norm": 0.8942958090189175,
"learning_rate": 1.1577344537000012e-06,
"loss": 0.3619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24931302666664124,
"step": 3575,
"valid_targets_mean": 3223.0,
"valid_targets_min": 1451
},
{
"epoch": 6.325375773651635,
"grad_norm": 0.8019003945889316,
"learning_rate": 1.128370201120419e-06,
"loss": 0.4175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2635502517223358,
"step": 3580,
"valid_targets_mean": 3202.5,
"valid_targets_min": 1373
},
{
"epoch": 6.334217506631299,
"grad_norm": 0.6817340392127685,
"learning_rate": 1.0993723265441835e-06,
"loss": 0.3823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13677793741226196,
"step": 3585,
"valid_targets_mean": 2905.6,
"valid_targets_min": 1394
},
{
"epoch": 6.343059239610964,
"grad_norm": 0.6095420535867488,
"learning_rate": 1.0707413929424626e-06,
"loss": 0.415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17292746901512146,
"step": 3590,
"valid_targets_mean": 3958.5,
"valid_targets_min": 2560
},
{
"epoch": 6.351900972590628,
"grad_norm": 0.6319517497546866,
"learning_rate": 1.0424779561625465e-06,
"loss": 0.3905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15072670578956604,
"step": 3595,
"valid_targets_mean": 3169.4,
"valid_targets_min": 981
},
{
"epoch": 6.360742705570292,
"grad_norm": 0.806370402271801,
"learning_rate": 1.0145825649170593e-06,
"loss": 0.4086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2352861762046814,
"step": 3600,
"valid_targets_mean": 2252.2,
"valid_targets_min": 323
},
{
"epoch": 6.369584438549956,
"grad_norm": 0.6699724587109076,
"learning_rate": 9.870557607733056e-07,
"loss": 0.3799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16308927536010742,
"step": 3605,
"valid_targets_mean": 3615.8,
"valid_targets_min": 415
},
{
"epoch": 6.37842617152962,
"grad_norm": 0.827228282016501,
"learning_rate": 9.59898078142767e-07,
"loss": 0.4035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2147194743156433,
"step": 3610,
"valid_targets_mean": 2595.4,
"valid_targets_min": 491
},
{
"epoch": 6.387267904509284,
"grad_norm": 0.6652223634579235,
"learning_rate": 9.331100442707108e-07,
"loss": 0.4052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17819935083389282,
"step": 3615,
"valid_targets_mean": 3927.1,
"valid_targets_min": 979
},
{
"epoch": 6.396109637488948,
"grad_norm": 0.7289789412288719,
"learning_rate": 9.066921792259654e-07,
"loss": 0.389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18159447610378265,
"step": 3620,
"valid_targets_mean": 3477.9,
"valid_targets_min": 363
},
{
"epoch": 6.404951370468612,
"grad_norm": 0.6396828577240828,
"learning_rate": 8.806449958908115e-07,
"loss": 0.382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22703109681606293,
"step": 3625,
"valid_targets_mean": 5019.6,
"valid_targets_min": 1272
},
{
"epoch": 6.413793103448276,
"grad_norm": 0.8721346570560746,
"learning_rate": 8.549689999510446e-07,
"loss": 0.3822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23551982641220093,
"step": 3630,
"valid_targets_mean": 2339.8,
"valid_targets_min": 431
},
{
"epoch": 6.42263483642794,
"grad_norm": 0.6947586156644703,
"learning_rate": 8.296646898861405e-07,
"loss": 0.3807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16428089141845703,
"step": 3635,
"valid_targets_mean": 3315.1,
"valid_targets_min": 706
},
{
"epoch": 6.431476569407604,
"grad_norm": 0.7795433915349836,
"learning_rate": 8.047325569595821e-07,
"loss": 0.3883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1826629936695099,
"step": 3640,
"valid_targets_mean": 2893.4,
"valid_targets_min": 458
},
{
"epoch": 6.440318302387268,
"grad_norm": 0.6984355115855847,
"learning_rate": 7.801730852093193e-07,
"loss": 0.4044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21642327308654785,
"step": 3645,
"valid_targets_mean": 3958.0,
"valid_targets_min": 435
},
{
"epoch": 6.449160035366932,
"grad_norm": 1.0772469112743712,
"learning_rate": 7.559867514383867e-07,
"loss": 0.3647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2273642122745514,
"step": 3650,
"valid_targets_mean": 3464.5,
"valid_targets_min": 565
},
{
"epoch": 6.458001768346596,
"grad_norm": 0.8907493802415359,
"learning_rate": 7.321740252056253e-07,
"loss": 0.4066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19292961061000824,
"step": 3655,
"valid_targets_mean": 2551.0,
"valid_targets_min": 358
},
{
"epoch": 6.4668435013262595,
"grad_norm": 0.8209923973422765,
"learning_rate": 7.087353688165776e-07,
"loss": 0.4453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1861528754234314,
"step": 3660,
"valid_targets_mean": 2526.1,
"valid_targets_min": 577
},
{
"epoch": 6.475685234305924,
"grad_norm": 0.7474743887332304,
"learning_rate": 6.856712373145158e-07,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22273015975952148,
"step": 3665,
"valid_targets_mean": 2730.5,
"valid_targets_min": 328
},
{
"epoch": 6.484526967285588,
"grad_norm": 0.7947503636901528,
"learning_rate": 6.62982078471599e-07,
"loss": 0.399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3024711310863495,
"step": 3670,
"valid_targets_mean": 4017.4,
"valid_targets_min": 826
},
{
"epoch": 6.493368700265252,
"grad_norm": 0.8974195325023576,
"learning_rate": 6.406683327801877e-07,
"loss": 0.3775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1381479799747467,
"step": 3675,
"valid_targets_mean": 1530.0,
"valid_targets_min": 406
},
{
"epoch": 6.502210433244916,
"grad_norm": 0.7191615989293343,
"learning_rate": 6.187304334442856e-07,
"loss": 0.3885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1408117115497589,
"step": 3680,
"valid_targets_mean": 3383.2,
"valid_targets_min": 736
},
{
"epoch": 6.51105216622458,
"grad_norm": 0.9329960975796369,
"learning_rate": 5.97168806371129e-07,
"loss": 0.3798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2396770715713501,
"step": 3685,
"valid_targets_mean": 2167.9,
"valid_targets_min": 769
},
{
"epoch": 6.519893899204244,
"grad_norm": 0.6478034299508139,
"learning_rate": 5.759838701629284e-07,
"loss": 0.3876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18991714715957642,
"step": 3690,
"valid_targets_mean": 3872.1,
"valid_targets_min": 1687
},
{
"epoch": 6.528735632183908,
"grad_norm": 0.665389821538992,
"learning_rate": 5.551760361087288e-07,
"loss": 0.3781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20422768592834473,
"step": 3695,
"valid_targets_mean": 3974.6,
"valid_targets_min": 1072
},
{
"epoch": 6.537577365163572,
"grad_norm": 0.8481964209332128,
"learning_rate": 5.347457081764318e-07,
"loss": 0.387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12965896725654602,
"step": 3700,
"valid_targets_mean": 2102.9,
"valid_targets_min": 547
},
{
"epoch": 6.546419098143236,
"grad_norm": 0.7959235784114853,
"learning_rate": 5.146932830049545e-07,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13871905207633972,
"step": 3705,
"valid_targets_mean": 2381.4,
"valid_targets_min": 416
},
{
"epoch": 6.5552608311229,
"grad_norm": 0.9738963676820827,
"learning_rate": 4.950191498965207e-07,
"loss": 0.391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24106061458587646,
"step": 3710,
"valid_targets_mean": 2475.1,
"valid_targets_min": 958
},
{
"epoch": 6.564102564102564,
"grad_norm": 0.6979946706582677,
"learning_rate": 4.7572369080910897e-07,
"loss": 0.402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.283669114112854,
"step": 3715,
"valid_targets_mean": 3481.0,
"valid_targets_min": 515
},
{
"epoch": 6.572944297082228,
"grad_norm": 0.8704935577886896,
"learning_rate": 4.568072803490409e-07,
"loss": 0.4178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18020617961883545,
"step": 3720,
"valid_targets_mean": 2580.9,
"valid_targets_min": 609
},
{
"epoch": 6.581786030061892,
"grad_norm": 0.7804746793990116,
"learning_rate": 4.382702857637022e-07,
"loss": 0.3803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17412936687469482,
"step": 3725,
"valid_targets_mean": 3689.2,
"valid_targets_min": 378
},
{
"epoch": 6.590627763041557,
"grad_norm": 0.8487934940824559,
"learning_rate": 4.2011306693441554e-07,
"loss": 0.4013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24455024302005768,
"step": 3730,
"valid_targets_mean": 2609.2,
"valid_targets_min": 657
},
{
"epoch": 6.59946949602122,
"grad_norm": 0.6852406296840956,
"learning_rate": 4.0233597636944565e-07,
"loss": 0.3904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19759978353977203,
"step": 3735,
"valid_targets_mean": 3594.5,
"valid_targets_min": 438
},
{
"epoch": 6.6083112290008845,
"grad_norm": 0.7416508492161489,
"learning_rate": 3.84939359197174e-07,
"loss": 0.4063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.138950914144516,
"step": 3740,
"valid_targets_mean": 2434.2,
"valid_targets_min": 283
},
{
"epoch": 6.6171529619805485,
"grad_norm": 0.8357824054733599,
"learning_rate": 3.6792355315937947e-07,
"loss": 0.3735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19350282847881317,
"step": 3745,
"valid_targets_mean": 2571.5,
"valid_targets_min": 1450
},
{
"epoch": 6.625994694960212,
"grad_norm": 0.8587156622200902,
"learning_rate": 3.5128888860468836e-07,
"loss": 0.3885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22190819680690765,
"step": 3750,
"valid_targets_mean": 3109.5,
"valid_targets_min": 339
},
{
"epoch": 6.634836427939876,
"grad_norm": 0.6581213951003092,
"learning_rate": 3.350356884821748e-07,
"loss": 0.4011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21432948112487793,
"step": 3755,
"valid_targets_mean": 3528.0,
"valid_targets_min": 635
},
{
"epoch": 6.64367816091954,
"grad_norm": 0.8286218218972864,
"learning_rate": 3.191642683350571e-07,
"loss": 0.3918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32919830083847046,
"step": 3760,
"valid_targets_mean": 4206.6,
"valid_targets_min": 560
},
{
"epoch": 6.652519893899204,
"grad_norm": 0.7950121098953326,
"learning_rate": 3.036749362946112e-07,
"loss": 0.388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18096879124641418,
"step": 3765,
"valid_targets_mean": 2454.1,
"valid_targets_min": 480
},
{
"epoch": 6.661361626878868,
"grad_norm": 0.7940166037642752,
"learning_rate": 2.8856799307415807e-07,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14865876734256744,
"step": 3770,
"valid_targets_mean": 2513.9,
"valid_targets_min": 888
},
{
"epoch": 6.670203359858532,
"grad_norm": 0.7495945684460611,
"learning_rate": 2.7384373196324365e-07,
"loss": 0.3681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11169509589672089,
"step": 3775,
"valid_targets_mean": 2019.8,
"valid_targets_min": 563
},
{
"epoch": 6.679045092838196,
"grad_norm": 0.711551778287024,
"learning_rate": 2.595024388219347e-07,
"loss": 0.3841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22360673546791077,
"step": 3780,
"valid_targets_mean": 3386.1,
"valid_targets_min": 459
},
{
"epoch": 6.68788682581786,
"grad_norm": 0.7177246883491567,
"learning_rate": 2.4554439207527424e-07,
"loss": 0.3825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19970688223838806,
"step": 3785,
"valid_targets_mean": 4797.1,
"valid_targets_min": 1729
},
{
"epoch": 6.696728558797524,
"grad_norm": 0.7780793009957203,
"learning_rate": 2.3196986270787704e-07,
"loss": 0.4226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3514820635318756,
"step": 3790,
"valid_targets_mean": 4338.2,
"valid_targets_min": 1681
},
{
"epoch": 6.705570291777188,
"grad_norm": 0.7174415720541817,
"learning_rate": 2.1877911425866705e-07,
"loss": 0.3864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15473148226737976,
"step": 3795,
"valid_targets_mean": 2806.8,
"valid_targets_min": 362
},
{
"epoch": 6.714412024756852,
"grad_norm": 0.6743683915959348,
"learning_rate": 2.059724028157506e-07,
"loss": 0.3834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16321048140525818,
"step": 3800,
"valid_targets_mean": 3285.9,
"valid_targets_min": 341
},
{
"epoch": 6.723253757736517,
"grad_norm": 0.7217029334413514,
"learning_rate": 1.9354997701146904e-07,
"loss": 0.3951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24354010820388794,
"step": 3805,
"valid_targets_mean": 3629.1,
"valid_targets_min": 1637
},
{
"epoch": 6.732095490716181,
"grad_norm": 0.7644466171909563,
"learning_rate": 1.8151207801754722e-07,
"loss": 0.4429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22783520817756653,
"step": 3810,
"valid_targets_mean": 3151.8,
"valid_targets_min": 679
},
{
"epoch": 6.740937223695845,
"grad_norm": 0.697996637149306,
"learning_rate": 1.6985893954042598e-07,
"loss": 0.4009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34702497720718384,
"step": 3815,
"valid_targets_mean": 5219.4,
"valid_targets_min": 661
},
{
"epoch": 6.749778956675509,
"grad_norm": 0.6524281262476507,
"learning_rate": 1.5859078781671477e-07,
"loss": 0.3758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16086144745349884,
"step": 3820,
"valid_targets_mean": 3767.5,
"valid_targets_min": 1390
},
{
"epoch": 6.758620689655173,
"grad_norm": 0.8703374924931297,
"learning_rate": 1.477078416088107e-07,
"loss": 0.383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.157963365316391,
"step": 3825,
"valid_targets_mean": 2099.6,
"valid_targets_min": 703
},
{
"epoch": 6.7674624226348365,
"grad_norm": 0.9150276768989083,
"learning_rate": 1.3721031220064185e-07,
"loss": 0.3985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20869338512420654,
"step": 3830,
"valid_targets_mean": 2169.6,
"valid_targets_min": 769
},
{
"epoch": 6.7763041556145005,
"grad_norm": 0.8582742028385791,
"learning_rate": 1.2709840339357515e-07,
"loss": 0.3803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1651896834373474,
"step": 3835,
"valid_targets_mean": 1981.6,
"valid_targets_min": 281
},
{
"epoch": 6.7851458885941645,
"grad_norm": 0.8933135468827135,
"learning_rate": 1.1737231150244388e-07,
"loss": 0.383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16246512532234192,
"step": 3840,
"valid_targets_mean": 2891.0,
"valid_targets_min": 542
},
{
"epoch": 6.793987621573828,
"grad_norm": 0.8039369028796995,
"learning_rate": 1.0803222535175295e-07,
"loss": 0.3603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12738923728466034,
"step": 3845,
"valid_targets_mean": 2474.1,
"valid_targets_min": 458
},
{
"epoch": 6.802829354553492,
"grad_norm": 0.800841966247947,
"learning_rate": 9.907832627200631e-08,
"loss": 0.3988,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19415853917598724,
"step": 3850,
"valid_targets_mean": 2828.2,
"valid_targets_min": 1638
},
{
"epoch": 6.811671087533156,
"grad_norm": 0.7602967171940971,
"learning_rate": 9.051078809618752e-08,
"loss": 0.3876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29658013582229614,
"step": 3855,
"valid_targets_mean": 4289.4,
"valid_targets_min": 1496
},
{
"epoch": 6.82051282051282,
"grad_norm": 0.6866320695142892,
"learning_rate": 8.232977715637358e-08,
"loss": 0.3803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22931569814682007,
"step": 3860,
"valid_targets_mean": 5008.4,
"valid_targets_min": 406
},
{
"epoch": 6.829354553492484,
"grad_norm": 0.8047620480314491,
"learning_rate": 7.453545228053305e-08,
"loss": 0.389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17397227883338928,
"step": 3865,
"valid_targets_mean": 2955.0,
"valid_targets_min": 544
},
{
"epoch": 6.838196286472148,
"grad_norm": 0.7586490896107623,
"learning_rate": 6.712796478940853e-08,
"loss": 0.4068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16233235597610474,
"step": 3870,
"valid_targets_mean": 2807.6,
"valid_targets_min": 372
},
{
"epoch": 6.847038019451812,
"grad_norm": 0.6581619537458464,
"learning_rate": 6.010745849361011e-08,
"loss": 0.3891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.133625328540802,
"step": 3875,
"valid_targets_mean": 4207.5,
"valid_targets_min": 275
},
{
"epoch": 6.855879752431477,
"grad_norm": 0.7436096405016829,
"learning_rate": 5.347406969079982e-08,
"loss": 0.417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1265230029821396,
"step": 3880,
"valid_targets_mean": 2987.5,
"valid_targets_min": 346
},
{
"epoch": 6.864721485411141,
"grad_norm": 0.7763730599939348,
"learning_rate": 4.722792716306046e-08,
"loss": 0.3896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20675580203533173,
"step": 3885,
"valid_targets_mean": 3732.2,
"valid_targets_min": 1566
},
{
"epoch": 6.873563218390805,
"grad_norm": 0.7715820038607789,
"learning_rate": 4.1369152174381975e-08,
"loss": 0.372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21535265445709229,
"step": 3890,
"valid_targets_mean": 3796.9,
"valid_targets_min": 674
},
{
"epoch": 6.882404951370469,
"grad_norm": 0.9019028296801088,
"learning_rate": 3.589785846832783e-08,
"loss": 0.3872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20554758608341217,
"step": 3895,
"valid_targets_mean": 2699.5,
"valid_targets_min": 889
},
{
"epoch": 6.891246684350133,
"grad_norm": 0.7944162594852624,
"learning_rate": 3.081415226579898e-08,
"loss": 0.3451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15075156092643738,
"step": 3900,
"valid_targets_mean": 2368.2,
"valid_targets_min": 783
},
{
"epoch": 6.900088417329797,
"grad_norm": 0.7617097376400151,
"learning_rate": 2.6118132263002193e-08,
"loss": 0.3851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1630379855632782,
"step": 3905,
"valid_targets_mean": 3169.9,
"valid_targets_min": 378
},
{
"epoch": 6.908930150309461,
"grad_norm": 0.7539821586393874,
"learning_rate": 2.18098896295027e-08,
"loss": 0.3911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14324209094047546,
"step": 3910,
"valid_targets_mean": 2474.1,
"valid_targets_min": 680
},
{
"epoch": 6.917771883289125,
"grad_norm": 0.797486908920383,
"learning_rate": 1.788950800648337e-08,
"loss": 0.3883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1615052968263626,
"step": 3915,
"valid_targets_mean": 2934.4,
"valid_targets_min": 354
},
{
"epoch": 6.926613616268789,
"grad_norm": 0.7651379607020341,
"learning_rate": 1.4357063505101576e-08,
"loss": 0.4133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14266857504844666,
"step": 3920,
"valid_targets_mean": 2230.8,
"valid_targets_min": 395
},
{
"epoch": 6.9354553492484525,
"grad_norm": 0.7502594071352197,
"learning_rate": 1.1212624705014829e-08,
"loss": 0.4242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.321631520986557,
"step": 3925,
"valid_targets_mean": 3950.1,
"valid_targets_min": 335
},
{
"epoch": 6.9442970822281165,
"grad_norm": 0.6647778859131394,
"learning_rate": 8.456252653055164e-09,
"loss": 0.4284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23882895708084106,
"step": 3930,
"valid_targets_mean": 3747.4,
"valid_targets_min": 556
},
{
"epoch": 6.95313881520778,
"grad_norm": 0.6155232006040645,
"learning_rate": 6.08800086204342e-09,
"loss": 0.3761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1027369350194931,
"step": 3935,
"valid_targets_mean": 3219.8,
"valid_targets_min": 1858
},
{
"epoch": 6.961980548187444,
"grad_norm": 0.9711608387054405,
"learning_rate": 4.107915309743416e-09,
"loss": 0.4059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.190896674990654,
"step": 3940,
"valid_targets_mean": 2195.4,
"valid_targets_min": 362
},
{
"epoch": 6.970822281167109,
"grad_norm": 0.7122188828888222,
"learning_rate": 2.516034437973769e-09,
"loss": 0.4263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21069204807281494,
"step": 3945,
"valid_targets_mean": 3195.0,
"valid_targets_min": 411
},
{
"epoch": 6.979664014146772,
"grad_norm": 0.7376023644733862,
"learning_rate": 1.312389151861826e-09,
"loss": 0.4027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25383979082107544,
"step": 3950,
"valid_targets_mean": 3817.6,
"valid_targets_min": 1252
},
{
"epoch": 6.988505747126437,
"grad_norm": 0.627582373951346,
"learning_rate": 4.970028192485821e-10,
"loss": 0.4011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1778397411108017,
"step": 3955,
"valid_targets_mean": 3882.2,
"valid_targets_min": 411
},
{
"epoch": 6.997347480106101,
"grad_norm": 0.7920130024563453,
"learning_rate": 6.989127021794773e-11,
"loss": 0.392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20227769017219543,
"step": 3960,
"valid_targets_mean": 2815.9,
"valid_targets_min": 305
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.48488524556159973,
"step": 3962,
"total_flos": 9.02500960062931e+17,
"train_loss": 0.468742822619895,
"train_runtime": 33154.24,
"train_samples_per_second": 1.91,
"train_steps_per_second": 0.12,
"valid_targets_mean": 3460.0,
"valid_targets_min": 1632
}
],
"logging_steps": 5,
"max_steps": 3962,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 9.02500960062931e+17,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}