9981 lines
277 KiB
JSON
9981 lines
277 KiB
JSON
{
|
|
"best_global_step": null,
|
|
"best_metric": null,
|
|
"best_model_checkpoint": null,
|
|
"epoch": 7.0,
|
|
"eval_steps": 500,
|
|
"global_step": 4515,
|
|
"is_hyper_param_search": false,
|
|
"is_local_process_zero": true,
|
|
"is_world_process_zero": true,
|
|
"log_history": [
|
|
{
|
|
"epoch": 0.007751937984496124,
|
|
"grad_norm": 10.737414411251518,
|
|
"learning_rate": 3.5398230088495575e-07,
|
|
"loss": 0.6122,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.5790383219718933,
|
|
"step": 5,
|
|
"valid_targets_mean": 5473.9,
|
|
"valid_targets_min": 2003
|
|
},
|
|
{
|
|
"epoch": 0.015503875968992248,
|
|
"grad_norm": 12.969006644336845,
|
|
"learning_rate": 7.964601769911505e-07,
|
|
"loss": 0.6056,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.6179184317588806,
|
|
"step": 10,
|
|
"valid_targets_mean": 4275.1,
|
|
"valid_targets_min": 2399
|
|
},
|
|
{
|
|
"epoch": 0.023255813953488372,
|
|
"grad_norm": 10.73852678993892,
|
|
"learning_rate": 1.2389380530973452e-06,
|
|
"loss": 0.6059,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.6460979580879211,
|
|
"step": 15,
|
|
"valid_targets_mean": 5231.6,
|
|
"valid_targets_min": 343
|
|
},
|
|
{
|
|
"epoch": 0.031007751937984496,
|
|
"grad_norm": 10.022340877272923,
|
|
"learning_rate": 1.68141592920354e-06,
|
|
"loss": 0.5736,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.5392199158668518,
|
|
"step": 20,
|
|
"valid_targets_mean": 5241.8,
|
|
"valid_targets_min": 310
|
|
},
|
|
{
|
|
"epoch": 0.03875968992248062,
|
|
"grad_norm": 5.037849526968358,
|
|
"learning_rate": 2.1238938053097345e-06,
|
|
"loss": 0.4978,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.3818526268005371,
|
|
"step": 25,
|
|
"valid_targets_mean": 5527.9,
|
|
"valid_targets_min": 614
|
|
},
|
|
{
|
|
"epoch": 0.046511627906976744,
|
|
"grad_norm": 4.262678982312242,
|
|
"learning_rate": 2.5663716814159294e-06,
|
|
"loss": 0.5324,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.6495624780654907,
|
|
"step": 30,
|
|
"valid_targets_mean": 3715.2,
|
|
"valid_targets_min": 408
|
|
},
|
|
{
|
|
"epoch": 0.05426356589147287,
|
|
"grad_norm": 2.3482137938148466,
|
|
"learning_rate": 3.0088495575221242e-06,
|
|
"loss": 0.4639,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.5476200580596924,
|
|
"step": 35,
|
|
"valid_targets_mean": 5361.5,
|
|
"valid_targets_min": 2437
|
|
},
|
|
{
|
|
"epoch": 0.06201550387596899,
|
|
"grad_norm": 1.46476205992856,
|
|
"learning_rate": 3.4513274336283186e-06,
|
|
"loss": 0.4293,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.46131038665771484,
|
|
"step": 40,
|
|
"valid_targets_mean": 5086.5,
|
|
"valid_targets_min": 272
|
|
},
|
|
{
|
|
"epoch": 0.06976744186046512,
|
|
"grad_norm": 1.3283216378548661,
|
|
"learning_rate": 3.8938053097345135e-06,
|
|
"loss": 0.4646,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.44244861602783203,
|
|
"step": 45,
|
|
"valid_targets_mean": 3978.5,
|
|
"valid_targets_min": 1865
|
|
},
|
|
{
|
|
"epoch": 0.07751937984496124,
|
|
"grad_norm": 1.0028919580355764,
|
|
"learning_rate": 4.336283185840709e-06,
|
|
"loss": 0.4339,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.4484736919403076,
|
|
"step": 50,
|
|
"valid_targets_mean": 5080.6,
|
|
"valid_targets_min": 2468
|
|
},
|
|
{
|
|
"epoch": 0.08527131782945736,
|
|
"grad_norm": 0.8265483597929661,
|
|
"learning_rate": 4.778761061946903e-06,
|
|
"loss": 0.3985,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.43008673191070557,
|
|
"step": 55,
|
|
"valid_targets_mean": 4308.8,
|
|
"valid_targets_min": 598
|
|
},
|
|
{
|
|
"epoch": 0.09302325581395349,
|
|
"grad_norm": 0.7109955989422742,
|
|
"learning_rate": 5.2212389380530985e-06,
|
|
"loss": 0.3726,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.34888190031051636,
|
|
"step": 60,
|
|
"valid_targets_mean": 4633.4,
|
|
"valid_targets_min": 2442
|
|
},
|
|
{
|
|
"epoch": 0.10077519379844961,
|
|
"grad_norm": 0.655988135659704,
|
|
"learning_rate": 5.663716814159292e-06,
|
|
"loss": 0.3799,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.34532463550567627,
|
|
"step": 65,
|
|
"valid_targets_mean": 3801.8,
|
|
"valid_targets_min": 299
|
|
},
|
|
{
|
|
"epoch": 0.10852713178294573,
|
|
"grad_norm": 0.5932763195572598,
|
|
"learning_rate": 6.1061946902654865e-06,
|
|
"loss": 0.3585,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.32048162817955017,
|
|
"step": 70,
|
|
"valid_targets_mean": 4474.1,
|
|
"valid_targets_min": 1430
|
|
},
|
|
{
|
|
"epoch": 0.11627906976744186,
|
|
"grad_norm": 0.5372600166593284,
|
|
"learning_rate": 6.548672566371682e-06,
|
|
"loss": 0.3061,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.3458303213119507,
|
|
"step": 75,
|
|
"valid_targets_mean": 5349.9,
|
|
"valid_targets_min": 2632
|
|
},
|
|
{
|
|
"epoch": 0.12403100775193798,
|
|
"grad_norm": 0.5539936993292226,
|
|
"learning_rate": 6.991150442477876e-06,
|
|
"loss": 0.357,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.3393269181251526,
|
|
"step": 80,
|
|
"valid_targets_mean": 4613.9,
|
|
"valid_targets_min": 642
|
|
},
|
|
{
|
|
"epoch": 0.13178294573643412,
|
|
"grad_norm": 0.5623006682180124,
|
|
"learning_rate": 7.4336283185840714e-06,
|
|
"loss": 0.348,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.37088829278945923,
|
|
"step": 85,
|
|
"valid_targets_mean": 5265.9,
|
|
"valid_targets_min": 2035
|
|
},
|
|
{
|
|
"epoch": 0.13953488372093023,
|
|
"grad_norm": 0.5992837863592103,
|
|
"learning_rate": 7.876106194690266e-06,
|
|
"loss": 0.3268,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.35172638297080994,
|
|
"step": 90,
|
|
"valid_targets_mean": 4771.9,
|
|
"valid_targets_min": 1048
|
|
},
|
|
{
|
|
"epoch": 0.14728682170542637,
|
|
"grad_norm": 0.45192427418479936,
|
|
"learning_rate": 8.31858407079646e-06,
|
|
"loss": 0.3372,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.3198494017124176,
|
|
"step": 95,
|
|
"valid_targets_mean": 5918.0,
|
|
"valid_targets_min": 368
|
|
},
|
|
{
|
|
"epoch": 0.15503875968992248,
|
|
"grad_norm": 0.625926887246749,
|
|
"learning_rate": 8.761061946902656e-06,
|
|
"loss": 0.3209,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.40857595205307007,
|
|
"step": 100,
|
|
"valid_targets_mean": 5248.5,
|
|
"valid_targets_min": 570
|
|
},
|
|
{
|
|
"epoch": 0.16279069767441862,
|
|
"grad_norm": 0.6811575704902189,
|
|
"learning_rate": 9.203539823008851e-06,
|
|
"loss": 0.3315,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.38290804624557495,
|
|
"step": 105,
|
|
"valid_targets_mean": 4731.9,
|
|
"valid_targets_min": 422
|
|
},
|
|
{
|
|
"epoch": 0.17054263565891473,
|
|
"grad_norm": 0.5566478870304039,
|
|
"learning_rate": 9.646017699115045e-06,
|
|
"loss": 0.3422,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.313689649105072,
|
|
"step": 110,
|
|
"valid_targets_mean": 4493.0,
|
|
"valid_targets_min": 485
|
|
},
|
|
{
|
|
"epoch": 0.17829457364341086,
|
|
"grad_norm": 0.41287589462882723,
|
|
"learning_rate": 1.008849557522124e-05,
|
|
"loss": 0.2705,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23904478549957275,
|
|
"step": 115,
|
|
"valid_targets_mean": 4980.3,
|
|
"valid_targets_min": 632
|
|
},
|
|
{
|
|
"epoch": 0.18604651162790697,
|
|
"grad_norm": 0.522088179939139,
|
|
"learning_rate": 1.0530973451327436e-05,
|
|
"loss": 0.3139,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.31741863489151,
|
|
"step": 120,
|
|
"valid_targets_mean": 3859.9,
|
|
"valid_targets_min": 361
|
|
},
|
|
{
|
|
"epoch": 0.1937984496124031,
|
|
"grad_norm": 0.5022551201886791,
|
|
"learning_rate": 1.0973451327433629e-05,
|
|
"loss": 0.2936,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.29989367723464966,
|
|
"step": 125,
|
|
"valid_targets_mean": 4806.8,
|
|
"valid_targets_min": 2268
|
|
},
|
|
{
|
|
"epoch": 0.20155038759689922,
|
|
"grad_norm": 0.43337385085835556,
|
|
"learning_rate": 1.1415929203539825e-05,
|
|
"loss": 0.316,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.26593732833862305,
|
|
"step": 130,
|
|
"valid_targets_mean": 5703.4,
|
|
"valid_targets_min": 861
|
|
},
|
|
{
|
|
"epoch": 0.20930232558139536,
|
|
"grad_norm": 0.5362034077276845,
|
|
"learning_rate": 1.1858407079646019e-05,
|
|
"loss": 0.2958,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.26804763078689575,
|
|
"step": 135,
|
|
"valid_targets_mean": 5329.9,
|
|
"valid_targets_min": 436
|
|
},
|
|
{
|
|
"epoch": 0.21705426356589147,
|
|
"grad_norm": 0.7869829849569835,
|
|
"learning_rate": 1.2300884955752212e-05,
|
|
"loss": 0.295,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2954621911048889,
|
|
"step": 140,
|
|
"valid_targets_mean": 4087.9,
|
|
"valid_targets_min": 367
|
|
},
|
|
{
|
|
"epoch": 0.2248062015503876,
|
|
"grad_norm": 0.4284133599416018,
|
|
"learning_rate": 1.2743362831858408e-05,
|
|
"loss": 0.2592,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22574186325073242,
|
|
"step": 145,
|
|
"valid_targets_mean": 4778.1,
|
|
"valid_targets_min": 658
|
|
},
|
|
{
|
|
"epoch": 0.23255813953488372,
|
|
"grad_norm": 0.43346642775630995,
|
|
"learning_rate": 1.3185840707964604e-05,
|
|
"loss": 0.265,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2442144900560379,
|
|
"step": 150,
|
|
"valid_targets_mean": 4813.1,
|
|
"valid_targets_min": 370
|
|
},
|
|
{
|
|
"epoch": 0.24031007751937986,
|
|
"grad_norm": 0.4612125175821135,
|
|
"learning_rate": 1.3628318584070797e-05,
|
|
"loss": 0.2645,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.25243520736694336,
|
|
"step": 155,
|
|
"valid_targets_mean": 4157.1,
|
|
"valid_targets_min": 806
|
|
},
|
|
{
|
|
"epoch": 0.24806201550387597,
|
|
"grad_norm": 0.4456387275424371,
|
|
"learning_rate": 1.4070796460176991e-05,
|
|
"loss": 0.3351,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.28738337755203247,
|
|
"step": 160,
|
|
"valid_targets_mean": 5481.4,
|
|
"valid_targets_min": 1940
|
|
},
|
|
{
|
|
"epoch": 0.2558139534883721,
|
|
"grad_norm": 0.5654786805272515,
|
|
"learning_rate": 1.4513274336283187e-05,
|
|
"loss": 0.2997,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.3355092406272888,
|
|
"step": 165,
|
|
"valid_targets_mean": 5211.9,
|
|
"valid_targets_min": 1841
|
|
},
|
|
{
|
|
"epoch": 0.26356589147286824,
|
|
"grad_norm": 0.4528552978301014,
|
|
"learning_rate": 1.4955752212389383e-05,
|
|
"loss": 0.2687,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24449273943901062,
|
|
"step": 170,
|
|
"valid_targets_mean": 4395.9,
|
|
"valid_targets_min": 716
|
|
},
|
|
{
|
|
"epoch": 0.2713178294573643,
|
|
"grad_norm": 0.5070510356795248,
|
|
"learning_rate": 1.5398230088495576e-05,
|
|
"loss": 0.2736,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2762889266014099,
|
|
"step": 175,
|
|
"valid_targets_mean": 5060.6,
|
|
"valid_targets_min": 332
|
|
},
|
|
{
|
|
"epoch": 0.27906976744186046,
|
|
"grad_norm": 0.4109586147637433,
|
|
"learning_rate": 1.5840707964601772e-05,
|
|
"loss": 0.2469,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.27871203422546387,
|
|
"step": 180,
|
|
"valid_targets_mean": 5762.0,
|
|
"valid_targets_min": 317
|
|
},
|
|
{
|
|
"epoch": 0.2868217054263566,
|
|
"grad_norm": 0.5312588834611185,
|
|
"learning_rate": 1.628318584070797e-05,
|
|
"loss": 0.2602,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21110810339450836,
|
|
"step": 185,
|
|
"valid_targets_mean": 4100.6,
|
|
"valid_targets_min": 312
|
|
},
|
|
{
|
|
"epoch": 0.29457364341085274,
|
|
"grad_norm": 0.5125684260379816,
|
|
"learning_rate": 1.672566371681416e-05,
|
|
"loss": 0.2584,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2507615089416504,
|
|
"step": 190,
|
|
"valid_targets_mean": 4268.3,
|
|
"valid_targets_min": 2439
|
|
},
|
|
{
|
|
"epoch": 0.3023255813953488,
|
|
"grad_norm": 0.6649775832883916,
|
|
"learning_rate": 1.7168141592920354e-05,
|
|
"loss": 0.2877,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.41589394211769104,
|
|
"step": 195,
|
|
"valid_targets_mean": 3739.2,
|
|
"valid_targets_min": 536
|
|
},
|
|
{
|
|
"epoch": 0.31007751937984496,
|
|
"grad_norm": 0.5366482871518907,
|
|
"learning_rate": 1.761061946902655e-05,
|
|
"loss": 0.2587,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.27435043454170227,
|
|
"step": 200,
|
|
"valid_targets_mean": 5772.8,
|
|
"valid_targets_min": 2700
|
|
},
|
|
{
|
|
"epoch": 0.3178294573643411,
|
|
"grad_norm": 0.5074784266785846,
|
|
"learning_rate": 1.8053097345132743e-05,
|
|
"loss": 0.281,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2721036970615387,
|
|
"step": 205,
|
|
"valid_targets_mean": 4397.0,
|
|
"valid_targets_min": 661
|
|
},
|
|
{
|
|
"epoch": 0.32558139534883723,
|
|
"grad_norm": 0.614506165275271,
|
|
"learning_rate": 1.849557522123894e-05,
|
|
"loss": 0.2917,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.30919021368026733,
|
|
"step": 210,
|
|
"valid_targets_mean": 4218.9,
|
|
"valid_targets_min": 472
|
|
},
|
|
{
|
|
"epoch": 0.3333333333333333,
|
|
"grad_norm": 0.5419591558618669,
|
|
"learning_rate": 1.8938053097345135e-05,
|
|
"loss": 0.2622,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23832359910011292,
|
|
"step": 215,
|
|
"valid_targets_mean": 5124.2,
|
|
"valid_targets_min": 2981
|
|
},
|
|
{
|
|
"epoch": 0.34108527131782945,
|
|
"grad_norm": 0.5664964725729073,
|
|
"learning_rate": 1.9380530973451328e-05,
|
|
"loss": 0.2701,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2373562753200531,
|
|
"step": 220,
|
|
"valid_targets_mean": 3882.1,
|
|
"valid_targets_min": 282
|
|
},
|
|
{
|
|
"epoch": 0.3488372093023256,
|
|
"grad_norm": 0.4209274671883887,
|
|
"learning_rate": 1.9823008849557524e-05,
|
|
"loss": 0.2434,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1936969757080078,
|
|
"step": 225,
|
|
"valid_targets_mean": 5481.6,
|
|
"valid_targets_min": 752
|
|
},
|
|
{
|
|
"epoch": 0.35658914728682173,
|
|
"grad_norm": 0.5074693857643466,
|
|
"learning_rate": 2.0265486725663717e-05,
|
|
"loss": 0.253,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.25986820459365845,
|
|
"step": 230,
|
|
"valid_targets_mean": 5012.3,
|
|
"valid_targets_min": 1855
|
|
},
|
|
{
|
|
"epoch": 0.3643410852713178,
|
|
"grad_norm": 0.5512784168137245,
|
|
"learning_rate": 2.0707964601769913e-05,
|
|
"loss": 0.2588,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.27459990978240967,
|
|
"step": 235,
|
|
"valid_targets_mean": 4073.4,
|
|
"valid_targets_min": 477
|
|
},
|
|
{
|
|
"epoch": 0.37209302325581395,
|
|
"grad_norm": 0.4347839613276555,
|
|
"learning_rate": 2.115044247787611e-05,
|
|
"loss": 0.2616,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24624979496002197,
|
|
"step": 240,
|
|
"valid_targets_mean": 5311.7,
|
|
"valid_targets_min": 968
|
|
},
|
|
{
|
|
"epoch": 0.3798449612403101,
|
|
"grad_norm": 0.5190963993227697,
|
|
"learning_rate": 2.15929203539823e-05,
|
|
"loss": 0.2566,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.252674400806427,
|
|
"step": 245,
|
|
"valid_targets_mean": 4257.4,
|
|
"valid_targets_min": 2687
|
|
},
|
|
{
|
|
"epoch": 0.3875968992248062,
|
|
"grad_norm": 0.5887863557318684,
|
|
"learning_rate": 2.2035398230088498e-05,
|
|
"loss": 0.2831,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.33351632952690125,
|
|
"step": 250,
|
|
"valid_targets_mean": 5280.2,
|
|
"valid_targets_min": 726
|
|
},
|
|
{
|
|
"epoch": 0.3953488372093023,
|
|
"grad_norm": 0.5068755318361087,
|
|
"learning_rate": 2.247787610619469e-05,
|
|
"loss": 0.2454,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20935970544815063,
|
|
"step": 255,
|
|
"valid_targets_mean": 4357.3,
|
|
"valid_targets_min": 365
|
|
},
|
|
{
|
|
"epoch": 0.40310077519379844,
|
|
"grad_norm": 0.4660973149935113,
|
|
"learning_rate": 2.2920353982300883e-05,
|
|
"loss": 0.2583,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2345641404390335,
|
|
"step": 260,
|
|
"valid_targets_mean": 4675.7,
|
|
"valid_targets_min": 472
|
|
},
|
|
{
|
|
"epoch": 0.4108527131782946,
|
|
"grad_norm": 0.4943641747428354,
|
|
"learning_rate": 2.3362831858407083e-05,
|
|
"loss": 0.2525,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.25245875120162964,
|
|
"step": 265,
|
|
"valid_targets_mean": 4586.7,
|
|
"valid_targets_min": 336
|
|
},
|
|
{
|
|
"epoch": 0.4186046511627907,
|
|
"grad_norm": 0.5733463209321147,
|
|
"learning_rate": 2.3805309734513275e-05,
|
|
"loss": 0.256,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2648470103740692,
|
|
"step": 270,
|
|
"valid_targets_mean": 4878.5,
|
|
"valid_targets_min": 1433
|
|
},
|
|
{
|
|
"epoch": 0.4263565891472868,
|
|
"grad_norm": 0.5797109099250628,
|
|
"learning_rate": 2.424778761061947e-05,
|
|
"loss": 0.2686,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23868052661418915,
|
|
"step": 275,
|
|
"valid_targets_mean": 4204.3,
|
|
"valid_targets_min": 1999
|
|
},
|
|
{
|
|
"epoch": 0.43410852713178294,
|
|
"grad_norm": 0.5102454710373611,
|
|
"learning_rate": 2.4690265486725668e-05,
|
|
"loss": 0.2299,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19877958297729492,
|
|
"step": 280,
|
|
"valid_targets_mean": 4676.9,
|
|
"valid_targets_min": 720
|
|
},
|
|
{
|
|
"epoch": 0.4418604651162791,
|
|
"grad_norm": 0.5432212420309249,
|
|
"learning_rate": 2.513274336283186e-05,
|
|
"loss": 0.2822,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.30621248483657837,
|
|
"step": 285,
|
|
"valid_targets_mean": 4931.0,
|
|
"valid_targets_min": 1914
|
|
},
|
|
{
|
|
"epoch": 0.4496124031007752,
|
|
"grad_norm": 0.5173046537936798,
|
|
"learning_rate": 2.5575221238938056e-05,
|
|
"loss": 0.236,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2177397459745407,
|
|
"step": 290,
|
|
"valid_targets_mean": 3951.5,
|
|
"valid_targets_min": 1846
|
|
},
|
|
{
|
|
"epoch": 0.4573643410852713,
|
|
"grad_norm": 0.47098388353840676,
|
|
"learning_rate": 2.601769911504425e-05,
|
|
"loss": 0.2311,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23170709609985352,
|
|
"step": 295,
|
|
"valid_targets_mean": 5152.0,
|
|
"valid_targets_min": 285
|
|
},
|
|
{
|
|
"epoch": 0.46511627906976744,
|
|
"grad_norm": 0.5012563709590744,
|
|
"learning_rate": 2.6460176991150442e-05,
|
|
"loss": 0.2354,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2445349246263504,
|
|
"step": 300,
|
|
"valid_targets_mean": 4086.8,
|
|
"valid_targets_min": 568
|
|
},
|
|
{
|
|
"epoch": 0.4728682170542636,
|
|
"grad_norm": 0.7598417766003686,
|
|
"learning_rate": 2.690265486725664e-05,
|
|
"loss": 0.2685,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2794634699821472,
|
|
"step": 305,
|
|
"valid_targets_mean": 6700.9,
|
|
"valid_targets_min": 2494
|
|
},
|
|
{
|
|
"epoch": 0.4806201550387597,
|
|
"grad_norm": 0.48809284746866477,
|
|
"learning_rate": 2.7345132743362834e-05,
|
|
"loss": 0.251,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23253998160362244,
|
|
"step": 310,
|
|
"valid_targets_mean": 4574.2,
|
|
"valid_targets_min": 600
|
|
},
|
|
{
|
|
"epoch": 0.4883720930232558,
|
|
"grad_norm": 0.5629581496018895,
|
|
"learning_rate": 2.7787610619469027e-05,
|
|
"loss": 0.2549,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.275101900100708,
|
|
"step": 315,
|
|
"valid_targets_mean": 4482.4,
|
|
"valid_targets_min": 380
|
|
},
|
|
{
|
|
"epoch": 0.49612403100775193,
|
|
"grad_norm": 0.5149842618437763,
|
|
"learning_rate": 2.8230088495575226e-05,
|
|
"loss": 0.241,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.26416015625,
|
|
"step": 320,
|
|
"valid_targets_mean": 4816.7,
|
|
"valid_targets_min": 2959
|
|
},
|
|
{
|
|
"epoch": 0.5038759689922481,
|
|
"grad_norm": 0.5415600825598276,
|
|
"learning_rate": 2.867256637168142e-05,
|
|
"loss": 0.2523,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2811618149280548,
|
|
"step": 325,
|
|
"valid_targets_mean": 5667.7,
|
|
"valid_targets_min": 559
|
|
},
|
|
{
|
|
"epoch": 0.5116279069767442,
|
|
"grad_norm": 0.5507831167513966,
|
|
"learning_rate": 2.9115044247787612e-05,
|
|
"loss": 0.2434,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2697560787200928,
|
|
"step": 330,
|
|
"valid_targets_mean": 4328.9,
|
|
"valid_targets_min": 314
|
|
},
|
|
{
|
|
"epoch": 0.5193798449612403,
|
|
"grad_norm": 0.444364635402833,
|
|
"learning_rate": 2.9557522123893808e-05,
|
|
"loss": 0.2478,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.26696139574050903,
|
|
"step": 335,
|
|
"valid_targets_mean": 5249.1,
|
|
"valid_targets_min": 216
|
|
},
|
|
{
|
|
"epoch": 0.5271317829457365,
|
|
"grad_norm": 0.5882361391451728,
|
|
"learning_rate": 3.0000000000000004e-05,
|
|
"loss": 0.2576,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2548302412033081,
|
|
"step": 340,
|
|
"valid_targets_mean": 3739.8,
|
|
"valid_targets_min": 2192
|
|
},
|
|
{
|
|
"epoch": 0.5348837209302325,
|
|
"grad_norm": 0.5152875122005142,
|
|
"learning_rate": 3.0442477876106197e-05,
|
|
"loss": 0.2569,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23482279479503632,
|
|
"step": 345,
|
|
"valid_targets_mean": 3619.9,
|
|
"valid_targets_min": 325
|
|
},
|
|
{
|
|
"epoch": 0.5426356589147286,
|
|
"grad_norm": 0.4815633298934971,
|
|
"learning_rate": 3.0884955752212396e-05,
|
|
"loss": 0.2373,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2350481003522873,
|
|
"step": 350,
|
|
"valid_targets_mean": 4721.2,
|
|
"valid_targets_min": 1866
|
|
},
|
|
{
|
|
"epoch": 0.5503875968992248,
|
|
"grad_norm": 0.4648544079642719,
|
|
"learning_rate": 3.132743362831859e-05,
|
|
"loss": 0.2243,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.181733176112175,
|
|
"step": 355,
|
|
"valid_targets_mean": 5043.9,
|
|
"valid_targets_min": 1925
|
|
},
|
|
{
|
|
"epoch": 0.5581395348837209,
|
|
"grad_norm": 0.5037726577202668,
|
|
"learning_rate": 3.176991150442478e-05,
|
|
"loss": 0.2506,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.29893919825553894,
|
|
"step": 360,
|
|
"valid_targets_mean": 4146.6,
|
|
"valid_targets_min": 419
|
|
},
|
|
{
|
|
"epoch": 0.5658914728682171,
|
|
"grad_norm": 0.4516342191965917,
|
|
"learning_rate": 3.2212389380530975e-05,
|
|
"loss": 0.269,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.251533180475235,
|
|
"step": 365,
|
|
"valid_targets_mean": 5648.9,
|
|
"valid_targets_min": 1948
|
|
},
|
|
{
|
|
"epoch": 0.5736434108527132,
|
|
"grad_norm": 0.510314234160131,
|
|
"learning_rate": 3.265486725663717e-05,
|
|
"loss": 0.2389,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2301664650440216,
|
|
"step": 370,
|
|
"valid_targets_mean": 4642.9,
|
|
"valid_targets_min": 357
|
|
},
|
|
{
|
|
"epoch": 0.5813953488372093,
|
|
"grad_norm": 0.5221420257676286,
|
|
"learning_rate": 3.309734513274337e-05,
|
|
"loss": 0.254,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.25842761993408203,
|
|
"step": 375,
|
|
"valid_targets_mean": 5166.7,
|
|
"valid_targets_min": 330
|
|
},
|
|
{
|
|
"epoch": 0.5891472868217055,
|
|
"grad_norm": 0.47841880099325107,
|
|
"learning_rate": 3.353982300884956e-05,
|
|
"loss": 0.2427,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23205696046352386,
|
|
"step": 380,
|
|
"valid_targets_mean": 4452.9,
|
|
"valid_targets_min": 2554
|
|
},
|
|
{
|
|
"epoch": 0.5968992248062015,
|
|
"grad_norm": 0.607600902063009,
|
|
"learning_rate": 3.398230088495575e-05,
|
|
"loss": 0.2396,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23086626827716827,
|
|
"step": 385,
|
|
"valid_targets_mean": 4332.0,
|
|
"valid_targets_min": 2478
|
|
},
|
|
{
|
|
"epoch": 0.6046511627906976,
|
|
"grad_norm": 0.5649861293006265,
|
|
"learning_rate": 3.4424778761061945e-05,
|
|
"loss": 0.2331,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2606998682022095,
|
|
"step": 390,
|
|
"valid_targets_mean": 3863.3,
|
|
"valid_targets_min": 355
|
|
},
|
|
{
|
|
"epoch": 0.6124031007751938,
|
|
"grad_norm": 0.5467855289956822,
|
|
"learning_rate": 3.4867256637168145e-05,
|
|
"loss": 0.2519,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24656961858272552,
|
|
"step": 395,
|
|
"valid_targets_mean": 4666.2,
|
|
"valid_targets_min": 1840
|
|
},
|
|
{
|
|
"epoch": 0.6201550387596899,
|
|
"grad_norm": 0.4033482565091616,
|
|
"learning_rate": 3.530973451327434e-05,
|
|
"loss": 0.2317,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19554291665554047,
|
|
"step": 400,
|
|
"valid_targets_mean": 5451.3,
|
|
"valid_targets_min": 285
|
|
},
|
|
{
|
|
"epoch": 0.627906976744186,
|
|
"grad_norm": 0.408434222869372,
|
|
"learning_rate": 3.575221238938053e-05,
|
|
"loss": 0.2523,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20927652716636658,
|
|
"step": 405,
|
|
"valid_targets_mean": 5175.1,
|
|
"valid_targets_min": 719
|
|
},
|
|
{
|
|
"epoch": 0.6356589147286822,
|
|
"grad_norm": 0.5142450144995636,
|
|
"learning_rate": 3.619469026548673e-05,
|
|
"loss": 0.2522,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.28972408175468445,
|
|
"step": 410,
|
|
"valid_targets_mean": 4840.2,
|
|
"valid_targets_min": 330
|
|
},
|
|
{
|
|
"epoch": 0.6434108527131783,
|
|
"grad_norm": 0.5130835281170955,
|
|
"learning_rate": 3.663716814159292e-05,
|
|
"loss": 0.271,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.27192896604537964,
|
|
"step": 415,
|
|
"valid_targets_mean": 4130.9,
|
|
"valid_targets_min": 836
|
|
},
|
|
{
|
|
"epoch": 0.6511627906976745,
|
|
"grad_norm": 0.5264620060585927,
|
|
"learning_rate": 3.707964601769912e-05,
|
|
"loss": 0.2475,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.30271440744400024,
|
|
"step": 420,
|
|
"valid_targets_mean": 4858.8,
|
|
"valid_targets_min": 566
|
|
},
|
|
{
|
|
"epoch": 0.6589147286821705,
|
|
"grad_norm": 0.48973643965756275,
|
|
"learning_rate": 3.7522123893805314e-05,
|
|
"loss": 0.2348,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19385236501693726,
|
|
"step": 425,
|
|
"valid_targets_mean": 4338.8,
|
|
"valid_targets_min": 808
|
|
},
|
|
{
|
|
"epoch": 0.6666666666666666,
|
|
"grad_norm": 0.47842223367968456,
|
|
"learning_rate": 3.796460176991151e-05,
|
|
"loss": 0.2404,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24353685975074768,
|
|
"step": 430,
|
|
"valid_targets_mean": 4000.3,
|
|
"valid_targets_min": 2352
|
|
},
|
|
{
|
|
"epoch": 0.6744186046511628,
|
|
"grad_norm": 0.45816881401918463,
|
|
"learning_rate": 3.840707964601771e-05,
|
|
"loss": 0.2455,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2597430646419525,
|
|
"step": 435,
|
|
"valid_targets_mean": 5271.6,
|
|
"valid_targets_min": 2162
|
|
},
|
|
{
|
|
"epoch": 0.6821705426356589,
|
|
"grad_norm": 0.6017326535707582,
|
|
"learning_rate": 3.88495575221239e-05,
|
|
"loss": 0.2444,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24369432032108307,
|
|
"step": 440,
|
|
"valid_targets_mean": 3065.4,
|
|
"valid_targets_min": 304
|
|
},
|
|
{
|
|
"epoch": 0.689922480620155,
|
|
"grad_norm": 0.5404602142547137,
|
|
"learning_rate": 3.929203539823009e-05,
|
|
"loss": 0.2078,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.256170392036438,
|
|
"step": 445,
|
|
"valid_targets_mean": 3592.6,
|
|
"valid_targets_min": 639
|
|
},
|
|
{
|
|
"epoch": 0.6976744186046512,
|
|
"grad_norm": 0.4154279511759285,
|
|
"learning_rate": 3.9734513274336285e-05,
|
|
"loss": 0.2272,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21489651501178741,
|
|
"step": 450,
|
|
"valid_targets_mean": 4713.6,
|
|
"valid_targets_min": 639
|
|
},
|
|
{
|
|
"epoch": 0.7054263565891473,
|
|
"grad_norm": 0.3730389962722997,
|
|
"learning_rate": 3.999997608524118e-05,
|
|
"loss": 0.2123,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1950041949748993,
|
|
"step": 455,
|
|
"valid_targets_mean": 6850.4,
|
|
"valid_targets_min": 2445
|
|
},
|
|
{
|
|
"epoch": 0.7131782945736435,
|
|
"grad_norm": 0.5017736757425001,
|
|
"learning_rate": 3.999970704486118e-05,
|
|
"loss": 0.2408,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2439410388469696,
|
|
"step": 460,
|
|
"valid_targets_mean": 4726.7,
|
|
"valid_targets_min": 1933
|
|
},
|
|
{
|
|
"epoch": 0.7209302325581395,
|
|
"grad_norm": 0.5145474700945507,
|
|
"learning_rate": 3.999913907468731e-05,
|
|
"loss": 0.2448,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2903444170951843,
|
|
"step": 465,
|
|
"valid_targets_mean": 3954.4,
|
|
"valid_targets_min": 606
|
|
},
|
|
{
|
|
"epoch": 0.7286821705426356,
|
|
"grad_norm": 0.39985614862149943,
|
|
"learning_rate": 3.9998272183208866e-05,
|
|
"loss": 0.242,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23064105212688446,
|
|
"step": 470,
|
|
"valid_targets_mean": 5725.1,
|
|
"valid_targets_min": 1885
|
|
},
|
|
{
|
|
"epoch": 0.7364341085271318,
|
|
"grad_norm": 0.47106899849704376,
|
|
"learning_rate": 3.999710638338303e-05,
|
|
"loss": 0.2096,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2777732014656067,
|
|
"step": 475,
|
|
"valid_targets_mean": 4932.4,
|
|
"valid_targets_min": 2437
|
|
},
|
|
{
|
|
"epoch": 0.7441860465116279,
|
|
"grad_norm": 0.5041908945885922,
|
|
"learning_rate": 3.999564169263465e-05,
|
|
"loss": 0.2204,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22737307846546173,
|
|
"step": 480,
|
|
"valid_targets_mean": 4427.4,
|
|
"valid_targets_min": 1030
|
|
},
|
|
{
|
|
"epoch": 0.751937984496124,
|
|
"grad_norm": 0.49803283079798477,
|
|
"learning_rate": 3.9993878132856044e-05,
|
|
"loss": 0.2328,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2756238579750061,
|
|
"step": 485,
|
|
"valid_targets_mean": 4327.5,
|
|
"valid_targets_min": 783
|
|
},
|
|
{
|
|
"epoch": 0.7596899224806202,
|
|
"grad_norm": 0.4206493823677622,
|
|
"learning_rate": 3.999181573040663e-05,
|
|
"loss": 0.2214,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2046414017677307,
|
|
"step": 490,
|
|
"valid_targets_mean": 5396.8,
|
|
"valid_targets_min": 646
|
|
},
|
|
{
|
|
"epoch": 0.7674418604651163,
|
|
"grad_norm": 0.4197719415269444,
|
|
"learning_rate": 3.9989454516112524e-05,
|
|
"loss": 0.25,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2041558027267456,
|
|
"step": 495,
|
|
"valid_targets_mean": 4688.8,
|
|
"valid_targets_min": 527
|
|
},
|
|
{
|
|
"epoch": 0.7751937984496124,
|
|
"grad_norm": 0.49956665072862294,
|
|
"learning_rate": 3.9986794525266115e-05,
|
|
"loss": 0.2538,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2720697820186615,
|
|
"step": 500,
|
|
"valid_targets_mean": 4991.1,
|
|
"valid_targets_min": 2320
|
|
},
|
|
{
|
|
"epoch": 0.7829457364341085,
|
|
"grad_norm": 0.5668838261772827,
|
|
"learning_rate": 3.998383579762552e-05,
|
|
"loss": 0.2275,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22524034976959229,
|
|
"step": 505,
|
|
"valid_targets_mean": 4758.6,
|
|
"valid_targets_min": 623
|
|
},
|
|
{
|
|
"epoch": 0.7906976744186046,
|
|
"grad_norm": 0.4067566904060681,
|
|
"learning_rate": 3.998057837741396e-05,
|
|
"loss": 0.2368,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20347392559051514,
|
|
"step": 510,
|
|
"valid_targets_mean": 5299.1,
|
|
"valid_targets_min": 957
|
|
},
|
|
{
|
|
"epoch": 0.7984496124031008,
|
|
"grad_norm": 0.4983262141277965,
|
|
"learning_rate": 3.997702231331917e-05,
|
|
"loss": 0.2254,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22835250198841095,
|
|
"step": 515,
|
|
"valid_targets_mean": 4676.3,
|
|
"valid_targets_min": 1825
|
|
},
|
|
{
|
|
"epoch": 0.8062015503875969,
|
|
"grad_norm": 0.4874737761112375,
|
|
"learning_rate": 3.9973167658492577e-05,
|
|
"loss": 0.2326,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1982721984386444,
|
|
"step": 520,
|
|
"valid_targets_mean": 3951.7,
|
|
"valid_targets_min": 308
|
|
},
|
|
{
|
|
"epoch": 0.813953488372093,
|
|
"grad_norm": 0.4874095166955721,
|
|
"learning_rate": 3.99690144705486e-05,
|
|
"loss": 0.2588,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.27957573533058167,
|
|
"step": 525,
|
|
"valid_targets_mean": 4523.2,
|
|
"valid_targets_min": 630
|
|
},
|
|
{
|
|
"epoch": 0.8217054263565892,
|
|
"grad_norm": 0.46829582316727847,
|
|
"learning_rate": 3.996456281156372e-05,
|
|
"loss": 0.2304,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2339038848876953,
|
|
"step": 530,
|
|
"valid_targets_mean": 4400.8,
|
|
"valid_targets_min": 996
|
|
},
|
|
{
|
|
"epoch": 0.8294573643410853,
|
|
"grad_norm": 0.4173667508062997,
|
|
"learning_rate": 3.995981274807561e-05,
|
|
"loss": 0.2288,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19771169126033783,
|
|
"step": 535,
|
|
"valid_targets_mean": 4821.5,
|
|
"valid_targets_min": 978
|
|
},
|
|
{
|
|
"epoch": 0.8372093023255814,
|
|
"grad_norm": 0.4998240530264507,
|
|
"learning_rate": 3.995476435108205e-05,
|
|
"loss": 0.2204,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23739448189735413,
|
|
"step": 540,
|
|
"valid_targets_mean": 3693.3,
|
|
"valid_targets_min": 527
|
|
},
|
|
{
|
|
"epoch": 0.8449612403100775,
|
|
"grad_norm": 0.40077148780586164,
|
|
"learning_rate": 3.994941769603999e-05,
|
|
"loss": 0.2402,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.25493863224983215,
|
|
"step": 545,
|
|
"valid_targets_mean": 6980.4,
|
|
"valid_targets_min": 3136
|
|
},
|
|
{
|
|
"epoch": 0.8527131782945736,
|
|
"grad_norm": 0.5106995708311232,
|
|
"learning_rate": 3.9943772862864303e-05,
|
|
"loss": 0.248,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.295318067073822,
|
|
"step": 550,
|
|
"valid_targets_mean": 4588.8,
|
|
"valid_targets_min": 2486
|
|
},
|
|
{
|
|
"epoch": 0.8604651162790697,
|
|
"grad_norm": 0.4775850652610667,
|
|
"learning_rate": 3.993782993592668e-05,
|
|
"loss": 0.2244,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2367231398820877,
|
|
"step": 555,
|
|
"valid_targets_mean": 4133.6,
|
|
"valid_targets_min": 513
|
|
},
|
|
{
|
|
"epoch": 0.8682170542635659,
|
|
"grad_norm": 0.4680021737678082,
|
|
"learning_rate": 3.9931589004054305e-05,
|
|
"loss": 0.2394,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23238858580589294,
|
|
"step": 560,
|
|
"valid_targets_mean": 4216.1,
|
|
"valid_targets_min": 516
|
|
},
|
|
{
|
|
"epoch": 0.875968992248062,
|
|
"grad_norm": 0.5582382675085276,
|
|
"learning_rate": 3.992505016052858e-05,
|
|
"loss": 0.2275,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24689146876335144,
|
|
"step": 565,
|
|
"valid_targets_mean": 4033.6,
|
|
"valid_targets_min": 1922
|
|
},
|
|
{
|
|
"epoch": 0.8837209302325582,
|
|
"grad_norm": 0.48825810766144667,
|
|
"learning_rate": 3.991821350308369e-05,
|
|
"loss": 0.2269,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23387084901332855,
|
|
"step": 570,
|
|
"valid_targets_mean": 4010.4,
|
|
"valid_targets_min": 946
|
|
},
|
|
{
|
|
"epoch": 0.8914728682170543,
|
|
"grad_norm": 0.3468810555031447,
|
|
"learning_rate": 3.991107913390516e-05,
|
|
"loss": 0.2017,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16606643795967102,
|
|
"step": 575,
|
|
"valid_targets_mean": 6431.9,
|
|
"valid_targets_min": 2510
|
|
},
|
|
{
|
|
"epoch": 0.8992248062015504,
|
|
"grad_norm": 0.4163415879240496,
|
|
"learning_rate": 3.990364715962833e-05,
|
|
"loss": 0.2258,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1997481882572174,
|
|
"step": 580,
|
|
"valid_targets_mean": 5320.4,
|
|
"valid_targets_min": 2104
|
|
},
|
|
{
|
|
"epoch": 0.9069767441860465,
|
|
"grad_norm": 0.5473724440573992,
|
|
"learning_rate": 3.989591769133675e-05,
|
|
"loss": 0.2154,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24773220717906952,
|
|
"step": 585,
|
|
"valid_targets_mean": 4261.8,
|
|
"valid_targets_min": 434
|
|
},
|
|
{
|
|
"epoch": 0.9147286821705426,
|
|
"grad_norm": 0.5436217489799219,
|
|
"learning_rate": 3.988789084456054e-05,
|
|
"loss": 0.232,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.26351064443588257,
|
|
"step": 590,
|
|
"valid_targets_mean": 3915.2,
|
|
"valid_targets_min": 551
|
|
},
|
|
{
|
|
"epoch": 0.9224806201550387,
|
|
"grad_norm": 0.41536583827338946,
|
|
"learning_rate": 3.9879566739274626e-05,
|
|
"loss": 0.2094,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2559744715690613,
|
|
"step": 595,
|
|
"valid_targets_mean": 5054.2,
|
|
"valid_targets_min": 2545
|
|
},
|
|
{
|
|
"epoch": 0.9302325581395349,
|
|
"grad_norm": 0.35411011586501473,
|
|
"learning_rate": 3.987094549989699e-05,
|
|
"loss": 0.2118,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18530899286270142,
|
|
"step": 600,
|
|
"valid_targets_mean": 5971.2,
|
|
"valid_targets_min": 1835
|
|
},
|
|
{
|
|
"epoch": 0.937984496124031,
|
|
"grad_norm": 0.4392551065067926,
|
|
"learning_rate": 3.98620272552868e-05,
|
|
"loss": 0.2495,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21953071653842926,
|
|
"step": 605,
|
|
"valid_targets_mean": 4565.2,
|
|
"valid_targets_min": 1942
|
|
},
|
|
{
|
|
"epoch": 0.9457364341085271,
|
|
"grad_norm": 0.47803844935864886,
|
|
"learning_rate": 3.985281213874244e-05,
|
|
"loss": 0.2298,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.29870736598968506,
|
|
"step": 610,
|
|
"valid_targets_mean": 4237.6,
|
|
"valid_targets_min": 326
|
|
},
|
|
{
|
|
"epoch": 0.9534883720930233,
|
|
"grad_norm": 0.44870011943315186,
|
|
"learning_rate": 3.984330028799957e-05,
|
|
"loss": 0.2274,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2335856556892395,
|
|
"step": 615,
|
|
"valid_targets_mean": 4557.3,
|
|
"valid_targets_min": 849
|
|
},
|
|
{
|
|
"epoch": 0.9612403100775194,
|
|
"grad_norm": 0.5014485102007264,
|
|
"learning_rate": 3.9833491845229065e-05,
|
|
"loss": 0.2085,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.253334641456604,
|
|
"step": 620,
|
|
"valid_targets_mean": 3717.8,
|
|
"valid_targets_min": 926
|
|
},
|
|
{
|
|
"epoch": 0.9689922480620154,
|
|
"grad_norm": 0.4539009088514093,
|
|
"learning_rate": 3.982338695703486e-05,
|
|
"loss": 0.2471,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2949668765068054,
|
|
"step": 625,
|
|
"valid_targets_mean": 4934.7,
|
|
"valid_targets_min": 685
|
|
},
|
|
{
|
|
"epoch": 0.9767441860465116,
|
|
"grad_norm": 0.42836269237630537,
|
|
"learning_rate": 3.9812985774451763e-05,
|
|
"loss": 0.227,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23034946620464325,
|
|
"step": 630,
|
|
"valid_targets_mean": 4939.8,
|
|
"valid_targets_min": 2461
|
|
},
|
|
{
|
|
"epoch": 0.9844961240310077,
|
|
"grad_norm": 0.6158981927965868,
|
|
"learning_rate": 3.980228845294323e-05,
|
|
"loss": 0.2103,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23234328627586365,
|
|
"step": 635,
|
|
"valid_targets_mean": 4101.9,
|
|
"valid_targets_min": 386
|
|
},
|
|
{
|
|
"epoch": 0.9922480620155039,
|
|
"grad_norm": 0.4762142114139161,
|
|
"learning_rate": 3.9791295152399014e-05,
|
|
"loss": 0.2229,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20974400639533997,
|
|
"step": 640,
|
|
"valid_targets_mean": 3889.9,
|
|
"valid_targets_min": 266
|
|
},
|
|
{
|
|
"epoch": 1.0,
|
|
"grad_norm": 0.5061517747796611,
|
|
"learning_rate": 3.978000603713276e-05,
|
|
"loss": 0.2162,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21345987915992737,
|
|
"step": 645,
|
|
"valid_targets_mean": 3841.9,
|
|
"valid_targets_min": 725
|
|
},
|
|
{
|
|
"epoch": 1.0077519379844961,
|
|
"grad_norm": 0.7869218457307112,
|
|
"learning_rate": 3.976842127587959e-05,
|
|
"loss": 0.2392,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23174425959587097,
|
|
"step": 650,
|
|
"valid_targets_mean": 5303.6,
|
|
"valid_targets_min": 1966
|
|
},
|
|
{
|
|
"epoch": 1.0155038759689923,
|
|
"grad_norm": 0.5003906965370145,
|
|
"learning_rate": 3.975654104179356e-05,
|
|
"loss": 0.2077,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22817862033843994,
|
|
"step": 655,
|
|
"valid_targets_mean": 3844.0,
|
|
"valid_targets_min": 568
|
|
},
|
|
{
|
|
"epoch": 1.0232558139534884,
|
|
"grad_norm": 0.4114203739700514,
|
|
"learning_rate": 3.9744365512445056e-05,
|
|
"loss": 0.2283,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.25271815061569214,
|
|
"step": 660,
|
|
"valid_targets_mean": 5901.1,
|
|
"valid_targets_min": 2452
|
|
},
|
|
{
|
|
"epoch": 1.0310077519379846,
|
|
"grad_norm": 0.4575096509840006,
|
|
"learning_rate": 3.973189486981818e-05,
|
|
"loss": 0.2171,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2162925899028778,
|
|
"step": 665,
|
|
"valid_targets_mean": 4902.4,
|
|
"valid_targets_min": 497
|
|
},
|
|
{
|
|
"epoch": 1.0387596899224807,
|
|
"grad_norm": 0.4021600509804852,
|
|
"learning_rate": 3.971912930030799e-05,
|
|
"loss": 0.2048,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19043004512786865,
|
|
"step": 670,
|
|
"valid_targets_mean": 4917.0,
|
|
"valid_targets_min": 646
|
|
},
|
|
{
|
|
"epoch": 1.0465116279069768,
|
|
"grad_norm": 0.4989156170962161,
|
|
"learning_rate": 3.970606899471774e-05,
|
|
"loss": 0.2215,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17856532335281372,
|
|
"step": 675,
|
|
"valid_targets_mean": 4752.6,
|
|
"valid_targets_min": 502
|
|
},
|
|
{
|
|
"epoch": 1.054263565891473,
|
|
"grad_norm": 0.3847796119558988,
|
|
"learning_rate": 3.969271414825599e-05,
|
|
"loss": 0.1926,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20729967951774597,
|
|
"step": 680,
|
|
"valid_targets_mean": 5683.9,
|
|
"valid_targets_min": 1844
|
|
},
|
|
{
|
|
"epoch": 1.062015503875969,
|
|
"grad_norm": 0.47657171710131,
|
|
"learning_rate": 3.967906496053377e-05,
|
|
"loss": 0.2187,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21222332119941711,
|
|
"step": 685,
|
|
"valid_targets_mean": 4150.8,
|
|
"valid_targets_min": 962
|
|
},
|
|
{
|
|
"epoch": 1.069767441860465,
|
|
"grad_norm": 0.3858090579432838,
|
|
"learning_rate": 3.966512163556149e-05,
|
|
"loss": 0.2201,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2170460969209671,
|
|
"step": 690,
|
|
"valid_targets_mean": 5164.2,
|
|
"valid_targets_min": 1885
|
|
},
|
|
{
|
|
"epoch": 1.0775193798449612,
|
|
"grad_norm": 0.4290059612627937,
|
|
"learning_rate": 3.965088438174597e-05,
|
|
"loss": 0.1915,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1908944547176361,
|
|
"step": 695,
|
|
"valid_targets_mean": 4788.8,
|
|
"valid_targets_min": 676
|
|
},
|
|
{
|
|
"epoch": 1.0852713178294573,
|
|
"grad_norm": 0.4409936183324337,
|
|
"learning_rate": 3.963635341188729e-05,
|
|
"loss": 0.2102,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23212580382823944,
|
|
"step": 700,
|
|
"valid_targets_mean": 4988.8,
|
|
"valid_targets_min": 558
|
|
},
|
|
{
|
|
"epoch": 1.0930232558139534,
|
|
"grad_norm": 0.45813599715819825,
|
|
"learning_rate": 3.962152894317564e-05,
|
|
"loss": 0.2243,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23683017492294312,
|
|
"step": 705,
|
|
"valid_targets_mean": 4570.3,
|
|
"valid_targets_min": 2488
|
|
},
|
|
{
|
|
"epoch": 1.1007751937984496,
|
|
"grad_norm": 0.40951900195560925,
|
|
"learning_rate": 3.960641119718802e-05,
|
|
"loss": 0.2143,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2278529703617096,
|
|
"step": 710,
|
|
"valid_targets_mean": 5026.8,
|
|
"valid_targets_min": 393
|
|
},
|
|
{
|
|
"epoch": 1.1085271317829457,
|
|
"grad_norm": 0.36962646479291916,
|
|
"learning_rate": 3.9591000399884974e-05,
|
|
"loss": 0.1855,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19535881280899048,
|
|
"step": 715,
|
|
"valid_targets_mean": 5893.4,
|
|
"valid_targets_min": 1714
|
|
},
|
|
{
|
|
"epoch": 1.1162790697674418,
|
|
"grad_norm": 0.4169785909813559,
|
|
"learning_rate": 3.957529678160721e-05,
|
|
"loss": 0.2211,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22500549256801605,
|
|
"step": 720,
|
|
"valid_targets_mean": 5345.6,
|
|
"valid_targets_min": 512
|
|
},
|
|
{
|
|
"epoch": 1.124031007751938,
|
|
"grad_norm": 0.49607819631085537,
|
|
"learning_rate": 3.9559300577072115e-05,
|
|
"loss": 0.2299,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.25468283891677856,
|
|
"step": 725,
|
|
"valid_targets_mean": 5040.8,
|
|
"valid_targets_min": 2775
|
|
},
|
|
{
|
|
"epoch": 1.1317829457364341,
|
|
"grad_norm": 0.5069100805388594,
|
|
"learning_rate": 3.954301202537032e-05,
|
|
"loss": 0.1978,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1782360076904297,
|
|
"step": 730,
|
|
"valid_targets_mean": 5846.9,
|
|
"valid_targets_min": 2328
|
|
},
|
|
{
|
|
"epoch": 1.1395348837209303,
|
|
"grad_norm": 0.5044747278952141,
|
|
"learning_rate": 3.952643136996205e-05,
|
|
"loss": 0.2022,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22031991183757782,
|
|
"step": 735,
|
|
"valid_targets_mean": 3806.4,
|
|
"valid_targets_min": 250
|
|
},
|
|
{
|
|
"epoch": 1.1472868217054264,
|
|
"grad_norm": 0.713115718875641,
|
|
"learning_rate": 3.950955885867353e-05,
|
|
"loss": 0.1987,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17436224222183228,
|
|
"step": 740,
|
|
"valid_targets_mean": 4936.1,
|
|
"valid_targets_min": 2127
|
|
},
|
|
{
|
|
"epoch": 1.1550387596899225,
|
|
"grad_norm": 0.5036250359903303,
|
|
"learning_rate": 3.9492394743693266e-05,
|
|
"loss": 0.2187,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2408798635005951,
|
|
"step": 745,
|
|
"valid_targets_mean": 3656.3,
|
|
"valid_targets_min": 555
|
|
},
|
|
{
|
|
"epoch": 1.1627906976744187,
|
|
"grad_norm": 0.46006096792307244,
|
|
"learning_rate": 3.94749392815683e-05,
|
|
"loss": 0.1973,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19669455289840698,
|
|
"step": 750,
|
|
"valid_targets_mean": 4952.6,
|
|
"valid_targets_min": 1766
|
|
},
|
|
{
|
|
"epoch": 1.1705426356589148,
|
|
"grad_norm": 0.4672041249500244,
|
|
"learning_rate": 3.9457192733200315e-05,
|
|
"loss": 0.2053,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1791488230228424,
|
|
"step": 755,
|
|
"valid_targets_mean": 4441.9,
|
|
"valid_targets_min": 650
|
|
},
|
|
{
|
|
"epoch": 1.178294573643411,
|
|
"grad_norm": 0.42348721602696954,
|
|
"learning_rate": 3.9439155363841814e-05,
|
|
"loss": 0.2092,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17398425936698914,
|
|
"step": 760,
|
|
"valid_targets_mean": 4538.8,
|
|
"valid_targets_min": 277
|
|
},
|
|
{
|
|
"epoch": 1.1860465116279069,
|
|
"grad_norm": 0.5878356373078284,
|
|
"learning_rate": 3.9420827443092104e-05,
|
|
"loss": 0.2076,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2349127233028412,
|
|
"step": 765,
|
|
"valid_targets_mean": 4086.5,
|
|
"valid_targets_min": 644
|
|
},
|
|
{
|
|
"epoch": 1.193798449612403,
|
|
"grad_norm": 0.476452037868028,
|
|
"learning_rate": 3.940220924489327e-05,
|
|
"loss": 0.2181,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2374195158481598,
|
|
"step": 770,
|
|
"valid_targets_mean": 3906.2,
|
|
"valid_targets_min": 487
|
|
},
|
|
{
|
|
"epoch": 1.2015503875968991,
|
|
"grad_norm": 0.4353925367240353,
|
|
"learning_rate": 3.938330104752609e-05,
|
|
"loss": 0.2182,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20411117374897003,
|
|
"step": 775,
|
|
"valid_targets_mean": 4184.5,
|
|
"valid_targets_min": 317
|
|
},
|
|
{
|
|
"epoch": 1.2093023255813953,
|
|
"grad_norm": 0.44738786787353246,
|
|
"learning_rate": 3.936410313360589e-05,
|
|
"loss": 0.2074,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.29115378856658936,
|
|
"step": 780,
|
|
"valid_targets_mean": 5176.8,
|
|
"valid_targets_min": 2427
|
|
},
|
|
{
|
|
"epoch": 1.2170542635658914,
|
|
"grad_norm": 0.5025078305803677,
|
|
"learning_rate": 3.934461579007829e-05,
|
|
"loss": 0.1905,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.194045752286911,
|
|
"step": 785,
|
|
"valid_targets_mean": 4190.2,
|
|
"valid_targets_min": 2274
|
|
},
|
|
{
|
|
"epoch": 1.2248062015503876,
|
|
"grad_norm": 0.399168491370644,
|
|
"learning_rate": 3.932483930821495e-05,
|
|
"loss": 0.2027,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19120316207408905,
|
|
"step": 790,
|
|
"valid_targets_mean": 5678.2,
|
|
"valid_targets_min": 2268
|
|
},
|
|
{
|
|
"epoch": 1.2325581395348837,
|
|
"grad_norm": 0.40122275394036194,
|
|
"learning_rate": 3.930477398360915e-05,
|
|
"loss": 0.2109,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20044457912445068,
|
|
"step": 795,
|
|
"valid_targets_mean": 5078.8,
|
|
"valid_targets_min": 1999
|
|
},
|
|
{
|
|
"epoch": 1.2403100775193798,
|
|
"grad_norm": 0.42534010971764247,
|
|
"learning_rate": 3.928442011617148e-05,
|
|
"loss": 0.2093,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21228013932704926,
|
|
"step": 800,
|
|
"valid_targets_mean": 3933.1,
|
|
"valid_targets_min": 757
|
|
},
|
|
{
|
|
"epoch": 1.248062015503876,
|
|
"grad_norm": 0.7069266989704566,
|
|
"learning_rate": 3.926377801012526e-05,
|
|
"loss": 0.2367,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22949740290641785,
|
|
"step": 805,
|
|
"valid_targets_mean": 4512.6,
|
|
"valid_targets_min": 299
|
|
},
|
|
{
|
|
"epoch": 1.255813953488372,
|
|
"grad_norm": 0.42027583645711425,
|
|
"learning_rate": 3.9242847974002026e-05,
|
|
"loss": 0.2204,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2134920060634613,
|
|
"step": 810,
|
|
"valid_targets_mean": 4943.6,
|
|
"valid_targets_min": 1805
|
|
},
|
|
{
|
|
"epoch": 1.2635658914728682,
|
|
"grad_norm": 0.39016064981111986,
|
|
"learning_rate": 3.9221630320636935e-05,
|
|
"loss": 0.2095,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19790124893188477,
|
|
"step": 815,
|
|
"valid_targets_mean": 4984.6,
|
|
"valid_targets_min": 2085
|
|
},
|
|
{
|
|
"epoch": 1.2713178294573644,
|
|
"grad_norm": 0.48120226759216767,
|
|
"learning_rate": 3.9200125367164076e-05,
|
|
"loss": 0.2083,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19904130697250366,
|
|
"step": 820,
|
|
"valid_targets_mean": 3452.6,
|
|
"valid_targets_min": 477
|
|
},
|
|
{
|
|
"epoch": 1.2790697674418605,
|
|
"grad_norm": 0.4551570397834542,
|
|
"learning_rate": 3.917833343501171e-05,
|
|
"loss": 0.1955,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19769467413425446,
|
|
"step": 825,
|
|
"valid_targets_mean": 5811.2,
|
|
"valid_targets_min": 923
|
|
},
|
|
{
|
|
"epoch": 1.2868217054263567,
|
|
"grad_norm": 0.43735207764564604,
|
|
"learning_rate": 3.91562548498975e-05,
|
|
"loss": 0.1992,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20643508434295654,
|
|
"step": 830,
|
|
"valid_targets_mean": 4570.1,
|
|
"valid_targets_min": 2493
|
|
},
|
|
{
|
|
"epoch": 1.2945736434108528,
|
|
"grad_norm": 0.4299580048955895,
|
|
"learning_rate": 3.913388994182364e-05,
|
|
"loss": 0.2196,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18837128579616547,
|
|
"step": 835,
|
|
"valid_targets_mean": 4744.1,
|
|
"valid_targets_min": 881
|
|
},
|
|
{
|
|
"epoch": 1.302325581395349,
|
|
"grad_norm": 0.3538726377495065,
|
|
"learning_rate": 3.9111239045071876e-05,
|
|
"loss": 0.1755,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13884110748767853,
|
|
"step": 840,
|
|
"valid_targets_mean": 5657.9,
|
|
"valid_targets_min": 453
|
|
},
|
|
{
|
|
"epoch": 1.310077519379845,
|
|
"grad_norm": 0.48494658304811955,
|
|
"learning_rate": 3.9088302498198564e-05,
|
|
"loss": 0.2032,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21122536063194275,
|
|
"step": 845,
|
|
"valid_targets_mean": 4122.8,
|
|
"valid_targets_min": 264
|
|
},
|
|
{
|
|
"epoch": 1.3178294573643412,
|
|
"grad_norm": 0.40106643807384035,
|
|
"learning_rate": 3.90650806440296e-05,
|
|
"loss": 0.1862,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19900798797607422,
|
|
"step": 850,
|
|
"valid_targets_mean": 5050.8,
|
|
"valid_targets_min": 2416
|
|
},
|
|
{
|
|
"epoch": 1.3255813953488373,
|
|
"grad_norm": 0.3960604184673925,
|
|
"learning_rate": 3.904157382965526e-05,
|
|
"loss": 0.2157,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22484715282917023,
|
|
"step": 855,
|
|
"valid_targets_mean": 5748.9,
|
|
"valid_targets_min": 1856
|
|
},
|
|
{
|
|
"epoch": 1.3333333333333333,
|
|
"grad_norm": 0.3257220820239636,
|
|
"learning_rate": 3.9017782406425045e-05,
|
|
"loss": 0.2088,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16785819828510284,
|
|
"step": 860,
|
|
"valid_targets_mean": 5923.4,
|
|
"valid_targets_min": 2779
|
|
},
|
|
{
|
|
"epoch": 1.3410852713178294,
|
|
"grad_norm": 0.4239797338208263,
|
|
"learning_rate": 3.899370672994244e-05,
|
|
"loss": 0.2188,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1850738823413849,
|
|
"step": 865,
|
|
"valid_targets_mean": 4976.4,
|
|
"valid_targets_min": 695
|
|
},
|
|
{
|
|
"epoch": 1.3488372093023255,
|
|
"grad_norm": 0.4680128138024682,
|
|
"learning_rate": 3.896934716005956e-05,
|
|
"loss": 0.219,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23862537741661072,
|
|
"step": 870,
|
|
"valid_targets_mean": 4609.4,
|
|
"valid_targets_min": 321
|
|
},
|
|
{
|
|
"epoch": 1.3565891472868217,
|
|
"grad_norm": 0.34295981747721627,
|
|
"learning_rate": 3.8944704060871803e-05,
|
|
"loss": 0.2328,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19128797948360443,
|
|
"step": 875,
|
|
"valid_targets_mean": 6440.4,
|
|
"valid_targets_min": 2928
|
|
},
|
|
{
|
|
"epoch": 1.3643410852713178,
|
|
"grad_norm": 0.39579678053682266,
|
|
"learning_rate": 3.891977780071238e-05,
|
|
"loss": 0.2386,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22662851214408875,
|
|
"step": 880,
|
|
"valid_targets_mean": 5590.4,
|
|
"valid_targets_min": 418
|
|
},
|
|
{
|
|
"epoch": 1.372093023255814,
|
|
"grad_norm": 0.3650270597088362,
|
|
"learning_rate": 3.889456875214685e-05,
|
|
"loss": 0.2028,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18867811560630798,
|
|
"step": 885,
|
|
"valid_targets_mean": 5108.4,
|
|
"valid_targets_min": 2550
|
|
},
|
|
{
|
|
"epoch": 1.37984496124031,
|
|
"grad_norm": 0.43546961058361106,
|
|
"learning_rate": 3.8869077291967514e-05,
|
|
"loss": 0.2091,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18624623119831085,
|
|
"step": 890,
|
|
"valid_targets_mean": 3812.8,
|
|
"valid_targets_min": 310
|
|
},
|
|
{
|
|
"epoch": 1.3875968992248062,
|
|
"grad_norm": 0.35003941903300767,
|
|
"learning_rate": 3.88433038011878e-05,
|
|
"loss": 0.1911,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17150872945785522,
|
|
"step": 895,
|
|
"valid_targets_mean": 5599.2,
|
|
"valid_targets_min": 2853
|
|
},
|
|
{
|
|
"epoch": 1.3953488372093024,
|
|
"grad_norm": 0.40616386423722534,
|
|
"learning_rate": 3.881724866503656e-05,
|
|
"loss": 0.207,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.221075639128685,
|
|
"step": 900,
|
|
"valid_targets_mean": 4683.5,
|
|
"valid_targets_min": 1955
|
|
},
|
|
{
|
|
"epoch": 1.4031007751937985,
|
|
"grad_norm": 0.45770780156293883,
|
|
"learning_rate": 3.879091227295233e-05,
|
|
"loss": 0.2342,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.3284824788570404,
|
|
"step": 905,
|
|
"valid_targets_mean": 5965.8,
|
|
"valid_targets_min": 2467
|
|
},
|
|
{
|
|
"epoch": 1.4108527131782946,
|
|
"grad_norm": 0.43076323744174305,
|
|
"learning_rate": 3.876429501857748e-05,
|
|
"loss": 0.2165,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2374260425567627,
|
|
"step": 910,
|
|
"valid_targets_mean": 5230.9,
|
|
"valid_targets_min": 2401
|
|
},
|
|
{
|
|
"epoch": 1.4186046511627908,
|
|
"grad_norm": 0.4744851861080025,
|
|
"learning_rate": 3.873739729975237e-05,
|
|
"loss": 0.2156,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22709140181541443,
|
|
"step": 915,
|
|
"valid_targets_mean": 3975.9,
|
|
"valid_targets_min": 281
|
|
},
|
|
{
|
|
"epoch": 1.4263565891472867,
|
|
"grad_norm": 0.4914323912239341,
|
|
"learning_rate": 3.871021951850935e-05,
|
|
"loss": 0.2059,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2681000232696533,
|
|
"step": 920,
|
|
"valid_targets_mean": 4153.2,
|
|
"valid_targets_min": 579
|
|
},
|
|
{
|
|
"epoch": 1.4341085271317828,
|
|
"grad_norm": 0.5702552607786674,
|
|
"learning_rate": 3.868276208106681e-05,
|
|
"loss": 0.2307,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23841242492198944,
|
|
"step": 925,
|
|
"valid_targets_mean": 4588.2,
|
|
"valid_targets_min": 330
|
|
},
|
|
{
|
|
"epoch": 1.441860465116279,
|
|
"grad_norm": 0.4960800862921102,
|
|
"learning_rate": 3.8655025397823054e-05,
|
|
"loss": 0.1843,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19032783806324005,
|
|
"step": 930,
|
|
"valid_targets_mean": 4889.1,
|
|
"valid_targets_min": 792
|
|
},
|
|
{
|
|
"epoch": 1.449612403100775,
|
|
"grad_norm": 0.3982547722090709,
|
|
"learning_rate": 3.862700988335022e-05,
|
|
"loss": 0.2096,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19539685547351837,
|
|
"step": 935,
|
|
"valid_targets_mean": 5027.4,
|
|
"valid_targets_min": 2790
|
|
},
|
|
{
|
|
"epoch": 1.4573643410852712,
|
|
"grad_norm": 0.4822298209707658,
|
|
"learning_rate": 3.8598715956388026e-05,
|
|
"loss": 0.218,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19648897647857666,
|
|
"step": 940,
|
|
"valid_targets_mean": 3873.2,
|
|
"valid_targets_min": 346
|
|
},
|
|
{
|
|
"epoch": 1.4651162790697674,
|
|
"grad_norm": 0.372486771897578,
|
|
"learning_rate": 3.8570144039837564e-05,
|
|
"loss": 0.2036,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15964803099632263,
|
|
"step": 945,
|
|
"valid_targets_mean": 4909.3,
|
|
"valid_targets_min": 2298
|
|
},
|
|
{
|
|
"epoch": 1.4728682170542635,
|
|
"grad_norm": 0.39582842776828425,
|
|
"learning_rate": 3.854129456075495e-05,
|
|
"loss": 0.2138,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1935088038444519,
|
|
"step": 950,
|
|
"valid_targets_mean": 5237.1,
|
|
"valid_targets_min": 2445
|
|
},
|
|
{
|
|
"epoch": 1.4806201550387597,
|
|
"grad_norm": 0.4768595855727291,
|
|
"learning_rate": 3.8512167950344916e-05,
|
|
"loss": 0.2198,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24240124225616455,
|
|
"step": 955,
|
|
"valid_targets_mean": 4105.6,
|
|
"valid_targets_min": 600
|
|
},
|
|
{
|
|
"epoch": 1.4883720930232558,
|
|
"grad_norm": 0.4935988281203597,
|
|
"learning_rate": 3.848276464395445e-05,
|
|
"loss": 0.2062,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24553832411766052,
|
|
"step": 960,
|
|
"valid_targets_mean": 4142.4,
|
|
"valid_targets_min": 821
|
|
},
|
|
{
|
|
"epoch": 1.496124031007752,
|
|
"grad_norm": 0.3508044933691806,
|
|
"learning_rate": 3.8453085081066195e-05,
|
|
"loss": 0.1977,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1662253439426422,
|
|
"step": 965,
|
|
"valid_targets_mean": 5088.2,
|
|
"valid_targets_min": 869
|
|
},
|
|
{
|
|
"epoch": 1.503875968992248,
|
|
"grad_norm": 0.40679599062954963,
|
|
"learning_rate": 3.842312970529193e-05,
|
|
"loss": 0.2284,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2687034010887146,
|
|
"step": 970,
|
|
"valid_targets_mean": 5584.9,
|
|
"valid_targets_min": 265
|
|
},
|
|
{
|
|
"epoch": 1.5116279069767442,
|
|
"grad_norm": 0.5352927860483538,
|
|
"learning_rate": 3.839289896436592e-05,
|
|
"loss": 0.2209,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24231748282909393,
|
|
"step": 975,
|
|
"valid_targets_mean": 3208.9,
|
|
"valid_targets_min": 401
|
|
},
|
|
{
|
|
"epoch": 1.5193798449612403,
|
|
"grad_norm": 0.4748472407205153,
|
|
"learning_rate": 3.836239331013825e-05,
|
|
"loss": 0.2151,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18979281187057495,
|
|
"step": 980,
|
|
"valid_targets_mean": 3701.5,
|
|
"valid_targets_min": 455
|
|
},
|
|
{
|
|
"epoch": 1.5271317829457365,
|
|
"grad_norm": 0.345182798324371,
|
|
"learning_rate": 3.8331613198568056e-05,
|
|
"loss": 0.1933,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.164521723985672,
|
|
"step": 985,
|
|
"valid_targets_mean": 5305.6,
|
|
"valid_targets_min": 2154
|
|
},
|
|
{
|
|
"epoch": 1.5348837209302326,
|
|
"grad_norm": 0.34148764388998604,
|
|
"learning_rate": 3.830055908971668e-05,
|
|
"loss": 0.1917,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1817236989736557,
|
|
"step": 990,
|
|
"valid_targets_mean": 5507.2,
|
|
"valid_targets_min": 322
|
|
},
|
|
{
|
|
"epoch": 1.5426356589147288,
|
|
"grad_norm": 0.3914530838647767,
|
|
"learning_rate": 3.8269231447740844e-05,
|
|
"loss": 0.2134,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18969038128852844,
|
|
"step": 995,
|
|
"valid_targets_mean": 5196.0,
|
|
"valid_targets_min": 827
|
|
},
|
|
{
|
|
"epoch": 1.550387596899225,
|
|
"grad_norm": 0.39571077331421817,
|
|
"learning_rate": 3.823763074088568e-05,
|
|
"loss": 0.2054,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.209140807390213,
|
|
"step": 1000,
|
|
"valid_targets_mean": 5359.5,
|
|
"valid_targets_min": 1861
|
|
},
|
|
{
|
|
"epoch": 1.558139534883721,
|
|
"grad_norm": 0.3713493032556294,
|
|
"learning_rate": 3.8205757441477755e-05,
|
|
"loss": 0.2178,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1935080587863922,
|
|
"step": 1005,
|
|
"valid_targets_mean": 5409.0,
|
|
"valid_targets_min": 2022
|
|
},
|
|
{
|
|
"epoch": 1.5658914728682172,
|
|
"grad_norm": 0.40758343223754234,
|
|
"learning_rate": 3.8173612025917984e-05,
|
|
"loss": 0.216,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19840386509895325,
|
|
"step": 1010,
|
|
"valid_targets_mean": 5117.1,
|
|
"valid_targets_min": 590
|
|
},
|
|
{
|
|
"epoch": 1.5736434108527133,
|
|
"grad_norm": 0.3957074242428162,
|
|
"learning_rate": 3.8141194974674534e-05,
|
|
"loss": 0.2104,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20921745896339417,
|
|
"step": 1015,
|
|
"valid_targets_mean": 4456.0,
|
|
"valid_targets_min": 391
|
|
},
|
|
{
|
|
"epoch": 1.5813953488372094,
|
|
"grad_norm": 0.3733502693439458,
|
|
"learning_rate": 3.810850677227561e-05,
|
|
"loss": 0.2013,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16597923636436462,
|
|
"step": 1020,
|
|
"valid_targets_mean": 4493.0,
|
|
"valid_targets_min": 529
|
|
},
|
|
{
|
|
"epoch": 1.5891472868217056,
|
|
"grad_norm": 0.3628573096363499,
|
|
"learning_rate": 3.8075547907302255e-05,
|
|
"loss": 0.2158,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20087650418281555,
|
|
"step": 1025,
|
|
"valid_targets_mean": 5676.1,
|
|
"valid_targets_min": 1946
|
|
},
|
|
{
|
|
"epoch": 1.5968992248062015,
|
|
"grad_norm": 0.4127367151722258,
|
|
"learning_rate": 3.804231887238103e-05,
|
|
"loss": 0.1975,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2233181893825531,
|
|
"step": 1030,
|
|
"valid_targets_mean": 4449.3,
|
|
"valid_targets_min": 977
|
|
},
|
|
{
|
|
"epoch": 1.6046511627906976,
|
|
"grad_norm": 0.3649731232133132,
|
|
"learning_rate": 3.800882016417662e-05,
|
|
"loss": 0.2217,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16599664092063904,
|
|
"step": 1035,
|
|
"valid_targets_mean": 4848.2,
|
|
"valid_targets_min": 1859
|
|
},
|
|
{
|
|
"epoch": 1.6124031007751938,
|
|
"grad_norm": 0.46927973730672984,
|
|
"learning_rate": 3.797505228338447e-05,
|
|
"loss": 0.2065,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2043415606021881,
|
|
"step": 1040,
|
|
"valid_targets_mean": 3859.1,
|
|
"valid_targets_min": 658
|
|
},
|
|
{
|
|
"epoch": 1.62015503875969,
|
|
"grad_norm": 0.452023920939608,
|
|
"learning_rate": 3.794101573472325e-05,
|
|
"loss": 0.1983,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24635906517505646,
|
|
"step": 1045,
|
|
"valid_targets_mean": 4854.6,
|
|
"valid_targets_min": 712
|
|
},
|
|
{
|
|
"epoch": 1.627906976744186,
|
|
"grad_norm": 0.41920457500146513,
|
|
"learning_rate": 3.7906711026927344e-05,
|
|
"loss": 0.1927,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21003258228302002,
|
|
"step": 1050,
|
|
"valid_targets_mean": 4362.9,
|
|
"valid_targets_min": 2643
|
|
},
|
|
{
|
|
"epoch": 1.6356589147286822,
|
|
"grad_norm": 0.46857169083181116,
|
|
"learning_rate": 3.787213867273921e-05,
|
|
"loss": 0.2055,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2265489399433136,
|
|
"step": 1055,
|
|
"valid_targets_mean": 4190.8,
|
|
"valid_targets_min": 1976
|
|
},
|
|
{
|
|
"epoch": 1.6434108527131783,
|
|
"grad_norm": 0.4767624399813519,
|
|
"learning_rate": 3.783729918890176e-05,
|
|
"loss": 0.2186,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17004413902759552,
|
|
"step": 1060,
|
|
"valid_targets_mean": 5151.8,
|
|
"valid_targets_min": 734
|
|
},
|
|
{
|
|
"epoch": 1.6511627906976745,
|
|
"grad_norm": 0.3947749262809709,
|
|
"learning_rate": 3.780219309615061e-05,
|
|
"loss": 0.2164,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20741719007492065,
|
|
"step": 1065,
|
|
"valid_targets_mean": 4775.2,
|
|
"valid_targets_min": 2041
|
|
},
|
|
{
|
|
"epoch": 1.6589147286821704,
|
|
"grad_norm": 0.3652762324269706,
|
|
"learning_rate": 3.7766820919206294e-05,
|
|
"loss": 0.2074,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1898358166217804,
|
|
"step": 1070,
|
|
"valid_targets_mean": 5115.6,
|
|
"valid_targets_min": 395
|
|
},
|
|
{
|
|
"epoch": 1.6666666666666665,
|
|
"grad_norm": 0.4172044880561881,
|
|
"learning_rate": 3.7731183186766444e-05,
|
|
"loss": 0.2037,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19984492659568787,
|
|
"step": 1075,
|
|
"valid_targets_mean": 4925.4,
|
|
"valid_targets_min": 2372
|
|
},
|
|
{
|
|
"epoch": 1.6744186046511627,
|
|
"grad_norm": 0.37343486351450866,
|
|
"learning_rate": 3.7695280431497845e-05,
|
|
"loss": 0.2067,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21672552824020386,
|
|
"step": 1080,
|
|
"valid_targets_mean": 5672.4,
|
|
"valid_targets_min": 3114
|
|
},
|
|
{
|
|
"epoch": 1.6821705426356588,
|
|
"grad_norm": 0.4094562646804994,
|
|
"learning_rate": 3.765911319002854e-05,
|
|
"loss": 0.2256,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2076679766178131,
|
|
"step": 1085,
|
|
"valid_targets_mean": 4861.9,
|
|
"valid_targets_min": 351
|
|
},
|
|
{
|
|
"epoch": 1.689922480620155,
|
|
"grad_norm": 0.31444076763215517,
|
|
"learning_rate": 3.762268200293973e-05,
|
|
"loss": 0.1921,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13465389609336853,
|
|
"step": 1090,
|
|
"valid_targets_mean": 4960.0,
|
|
"valid_targets_min": 566
|
|
},
|
|
{
|
|
"epoch": 1.697674418604651,
|
|
"grad_norm": 0.4339023669513262,
|
|
"learning_rate": 3.7585987414757774e-05,
|
|
"loss": 0.2153,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1692432165145874,
|
|
"step": 1095,
|
|
"valid_targets_mean": 3976.5,
|
|
"valid_targets_min": 1131
|
|
},
|
|
{
|
|
"epoch": 1.7054263565891472,
|
|
"grad_norm": 0.493759660874177,
|
|
"learning_rate": 3.754902997394597e-05,
|
|
"loss": 0.2076,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20814771950244904,
|
|
"step": 1100,
|
|
"valid_targets_mean": 4421.8,
|
|
"valid_targets_min": 682
|
|
},
|
|
{
|
|
"epoch": 1.7131782945736433,
|
|
"grad_norm": 0.39667125615949944,
|
|
"learning_rate": 3.7511810232896435e-05,
|
|
"loss": 0.2221,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24969351291656494,
|
|
"step": 1105,
|
|
"valid_targets_mean": 6635.4,
|
|
"valid_targets_min": 767
|
|
},
|
|
{
|
|
"epoch": 1.7209302325581395,
|
|
"grad_norm": 0.40845510116998796,
|
|
"learning_rate": 3.7474328747921776e-05,
|
|
"loss": 0.192,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2053869366645813,
|
|
"step": 1110,
|
|
"valid_targets_mean": 4257.3,
|
|
"valid_targets_min": 669
|
|
},
|
|
{
|
|
"epoch": 1.7286821705426356,
|
|
"grad_norm": 0.3654829840675916,
|
|
"learning_rate": 3.743658607924683e-05,
|
|
"loss": 0.2047,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20669598877429962,
|
|
"step": 1115,
|
|
"valid_targets_mean": 5434.2,
|
|
"valid_targets_min": 599
|
|
},
|
|
{
|
|
"epoch": 1.7364341085271318,
|
|
"grad_norm": 0.437762903353236,
|
|
"learning_rate": 3.739858279100028e-05,
|
|
"loss": 0.1922,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2025665044784546,
|
|
"step": 1120,
|
|
"valid_targets_mean": 5428.5,
|
|
"valid_targets_min": 3371
|
|
},
|
|
{
|
|
"epoch": 1.744186046511628,
|
|
"grad_norm": 0.5392878995782371,
|
|
"learning_rate": 3.736031945120621e-05,
|
|
"loss": 0.2211,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22214415669441223,
|
|
"step": 1125,
|
|
"valid_targets_mean": 4204.6,
|
|
"valid_targets_min": 1972
|
|
},
|
|
{
|
|
"epoch": 1.751937984496124,
|
|
"grad_norm": 0.550987196574115,
|
|
"learning_rate": 3.732179663177559e-05,
|
|
"loss": 0.1964,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17631106078624725,
|
|
"step": 1130,
|
|
"valid_targets_mean": 5127.2,
|
|
"valid_targets_min": 2529
|
|
},
|
|
{
|
|
"epoch": 1.7596899224806202,
|
|
"grad_norm": 0.3704297654863633,
|
|
"learning_rate": 3.728301490849778e-05,
|
|
"loss": 0.2116,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18758273124694824,
|
|
"step": 1135,
|
|
"valid_targets_mean": 5341.6,
|
|
"valid_targets_min": 2320
|
|
},
|
|
{
|
|
"epoch": 1.7674418604651163,
|
|
"grad_norm": 0.466284801284017,
|
|
"learning_rate": 3.7243974861031915e-05,
|
|
"loss": 0.2052,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.27421271800994873,
|
|
"step": 1140,
|
|
"valid_targets_mean": 4469.6,
|
|
"valid_targets_min": 2055
|
|
},
|
|
{
|
|
"epoch": 1.7751937984496124,
|
|
"grad_norm": 0.4548187236481328,
|
|
"learning_rate": 3.720467707289819e-05,
|
|
"loss": 0.1848,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19912035763263702,
|
|
"step": 1145,
|
|
"valid_targets_mean": 5421.1,
|
|
"valid_targets_min": 297
|
|
},
|
|
{
|
|
"epoch": 1.7829457364341086,
|
|
"grad_norm": 0.4234654458795664,
|
|
"learning_rate": 3.7165122131469205e-05,
|
|
"loss": 0.1967,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20600225031375885,
|
|
"step": 1150,
|
|
"valid_targets_mean": 4677.9,
|
|
"valid_targets_min": 632
|
|
},
|
|
{
|
|
"epoch": 1.7906976744186047,
|
|
"grad_norm": 0.4892297020617883,
|
|
"learning_rate": 3.712531062796114e-05,
|
|
"loss": 0.2302,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2325432002544403,
|
|
"step": 1155,
|
|
"valid_targets_mean": 3676.9,
|
|
"valid_targets_min": 378
|
|
},
|
|
{
|
|
"epoch": 1.7984496124031009,
|
|
"grad_norm": 0.4615952861064993,
|
|
"learning_rate": 3.708524315742494e-05,
|
|
"loss": 0.2095,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20138488709926605,
|
|
"step": 1160,
|
|
"valid_targets_mean": 3587.5,
|
|
"valid_targets_min": 649
|
|
},
|
|
{
|
|
"epoch": 1.806201550387597,
|
|
"grad_norm": 0.4107586531975636,
|
|
"learning_rate": 3.704492031873742e-05,
|
|
"loss": 0.2085,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18871745467185974,
|
|
"step": 1165,
|
|
"valid_targets_mean": 4104.7,
|
|
"valid_targets_min": 322
|
|
},
|
|
{
|
|
"epoch": 1.8139534883720931,
|
|
"grad_norm": 0.4364150036844027,
|
|
"learning_rate": 3.700434271459229e-05,
|
|
"loss": 0.1851,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18455129861831665,
|
|
"step": 1170,
|
|
"valid_targets_mean": 4351.6,
|
|
"valid_targets_min": 528
|
|
},
|
|
{
|
|
"epoch": 1.8217054263565893,
|
|
"grad_norm": 0.40802425859518093,
|
|
"learning_rate": 3.696351095149117e-05,
|
|
"loss": 0.2017,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20364965498447418,
|
|
"step": 1175,
|
|
"valid_targets_mean": 4112.6,
|
|
"valid_targets_min": 567
|
|
},
|
|
{
|
|
"epoch": 1.8294573643410854,
|
|
"grad_norm": 0.4032478517472396,
|
|
"learning_rate": 3.692242563973454e-05,
|
|
"loss": 0.2209,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.25360697507858276,
|
|
"step": 1180,
|
|
"valid_targets_mean": 5295.9,
|
|
"valid_targets_min": 556
|
|
},
|
|
{
|
|
"epoch": 1.8372093023255816,
|
|
"grad_norm": 0.4614085026878937,
|
|
"learning_rate": 3.688108739341258e-05,
|
|
"loss": 0.1926,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20508089661598206,
|
|
"step": 1185,
|
|
"valid_targets_mean": 3781.7,
|
|
"valid_targets_min": 270
|
|
},
|
|
{
|
|
"epoch": 1.8449612403100775,
|
|
"grad_norm": 0.3802819813887152,
|
|
"learning_rate": 3.683949683039602e-05,
|
|
"loss": 0.2274,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20417264103889465,
|
|
"step": 1190,
|
|
"valid_targets_mean": 4810.9,
|
|
"valid_targets_min": 946
|
|
},
|
|
{
|
|
"epoch": 1.8527131782945736,
|
|
"grad_norm": 0.43348296046621254,
|
|
"learning_rate": 3.679765457232687e-05,
|
|
"loss": 0.2113,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19152264297008514,
|
|
"step": 1195,
|
|
"valid_targets_mean": 5837.1,
|
|
"valid_targets_min": 272
|
|
},
|
|
{
|
|
"epoch": 1.8604651162790697,
|
|
"grad_norm": 0.40270266495111867,
|
|
"learning_rate": 3.675556124460918e-05,
|
|
"loss": 0.2061,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18859389424324036,
|
|
"step": 1200,
|
|
"valid_targets_mean": 4652.8,
|
|
"valid_targets_min": 2805
|
|
},
|
|
{
|
|
"epoch": 1.8682170542635659,
|
|
"grad_norm": 0.3784724852972052,
|
|
"learning_rate": 3.6713217476399654e-05,
|
|
"loss": 0.2069,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22137880325317383,
|
|
"step": 1205,
|
|
"valid_targets_mean": 5666.8,
|
|
"valid_targets_min": 1380
|
|
},
|
|
{
|
|
"epoch": 1.875968992248062,
|
|
"grad_norm": 0.3563867466614007,
|
|
"learning_rate": 3.6670623900598264e-05,
|
|
"loss": 0.1915,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17663565278053284,
|
|
"step": 1210,
|
|
"valid_targets_mean": 4829.3,
|
|
"valid_targets_min": 2526
|
|
},
|
|
{
|
|
"epoch": 1.8837209302325582,
|
|
"grad_norm": 0.32541904092615365,
|
|
"learning_rate": 3.662778115383876e-05,
|
|
"loss": 0.2149,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1512431651353836,
|
|
"step": 1215,
|
|
"valid_targets_mean": 5500.1,
|
|
"valid_targets_min": 300
|
|
},
|
|
{
|
|
"epoch": 1.8914728682170543,
|
|
"grad_norm": 0.3562253665751596,
|
|
"learning_rate": 3.6584689876479206e-05,
|
|
"loss": 0.195,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16320425271987915,
|
|
"step": 1220,
|
|
"valid_targets_mean": 4741.8,
|
|
"valid_targets_min": 335
|
|
},
|
|
{
|
|
"epoch": 1.8992248062015504,
|
|
"grad_norm": 0.4242425218762759,
|
|
"learning_rate": 3.654135071259237e-05,
|
|
"loss": 0.2005,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18462225794792175,
|
|
"step": 1225,
|
|
"valid_targets_mean": 3879.1,
|
|
"valid_targets_min": 725
|
|
},
|
|
{
|
|
"epoch": 1.9069767441860463,
|
|
"grad_norm": 0.44990621216299576,
|
|
"learning_rate": 3.6497764309956104e-05,
|
|
"loss": 0.2089,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2571909725666046,
|
|
"step": 1230,
|
|
"valid_targets_mean": 5112.8,
|
|
"valid_targets_min": 2435
|
|
},
|
|
{
|
|
"epoch": 1.9147286821705425,
|
|
"grad_norm": 0.3514156745181372,
|
|
"learning_rate": 3.645393132004367e-05,
|
|
"loss": 0.2113,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2239769548177719,
|
|
"step": 1235,
|
|
"valid_targets_mean": 5990.8,
|
|
"valid_targets_min": 2526
|
|
},
|
|
{
|
|
"epoch": 1.9224806201550386,
|
|
"grad_norm": 0.4438288563404829,
|
|
"learning_rate": 3.640985239801399e-05,
|
|
"loss": 0.2021,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23280391097068787,
|
|
"step": 1240,
|
|
"valid_targets_mean": 3919.9,
|
|
"valid_targets_min": 339
|
|
},
|
|
{
|
|
"epoch": 1.9302325581395348,
|
|
"grad_norm": 0.42245513107437865,
|
|
"learning_rate": 3.636552820270189e-05,
|
|
"loss": 0.1932,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20294125378131866,
|
|
"step": 1245,
|
|
"valid_targets_mean": 4123.6,
|
|
"valid_targets_min": 608
|
|
},
|
|
{
|
|
"epoch": 1.937984496124031,
|
|
"grad_norm": 0.36173604376638907,
|
|
"learning_rate": 3.632095939660817e-05,
|
|
"loss": 0.1921,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19740913808345795,
|
|
"step": 1250,
|
|
"valid_targets_mean": 4450.7,
|
|
"valid_targets_min": 243
|
|
},
|
|
{
|
|
"epoch": 1.945736434108527,
|
|
"grad_norm": 0.4185963445294981,
|
|
"learning_rate": 3.627614664588981e-05,
|
|
"loss": 0.1975,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20765337347984314,
|
|
"step": 1255,
|
|
"valid_targets_mean": 4475.6,
|
|
"valid_targets_min": 614
|
|
},
|
|
{
|
|
"epoch": 1.9534883720930232,
|
|
"grad_norm": 0.38392441124931787,
|
|
"learning_rate": 3.623109062034994e-05,
|
|
"loss": 0.2078,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19816569983959198,
|
|
"step": 1260,
|
|
"valid_targets_mean": 4867.6,
|
|
"valid_targets_min": 655
|
|
},
|
|
{
|
|
"epoch": 1.9612403100775193,
|
|
"grad_norm": 0.43839350861224635,
|
|
"learning_rate": 3.618579199342783e-05,
|
|
"loss": 0.1831,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20989343523979187,
|
|
"step": 1265,
|
|
"valid_targets_mean": 4077.1,
|
|
"valid_targets_min": 860
|
|
},
|
|
{
|
|
"epoch": 1.9689922480620154,
|
|
"grad_norm": 0.4040165567082679,
|
|
"learning_rate": 3.614025144218887e-05,
|
|
"loss": 0.2062,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21057480573654175,
|
|
"step": 1270,
|
|
"valid_targets_mean": 4318.6,
|
|
"valid_targets_min": 573
|
|
},
|
|
{
|
|
"epoch": 1.9767441860465116,
|
|
"grad_norm": 0.43337547842383023,
|
|
"learning_rate": 3.60944696473144e-05,
|
|
"loss": 0.2247,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1987258493900299,
|
|
"step": 1275,
|
|
"valid_targets_mean": 4023.1,
|
|
"valid_targets_min": 526
|
|
},
|
|
{
|
|
"epoch": 1.9844961240310077,
|
|
"grad_norm": 0.3271715231556842,
|
|
"learning_rate": 3.604844729309158e-05,
|
|
"loss": 0.17,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17882460355758667,
|
|
"step": 1280,
|
|
"valid_targets_mean": 6442.8,
|
|
"valid_targets_min": 2484
|
|
},
|
|
{
|
|
"epoch": 1.9922480620155039,
|
|
"grad_norm": 0.40322376508720353,
|
|
"learning_rate": 3.6002185067403126e-05,
|
|
"loss": 0.2075,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21025332808494568,
|
|
"step": 1285,
|
|
"valid_targets_mean": 4968.1,
|
|
"valid_targets_min": 1984
|
|
},
|
|
{
|
|
"epoch": 2.0,
|
|
"grad_norm": 0.43384474464309075,
|
|
"learning_rate": 3.5955683661717045e-05,
|
|
"loss": 0.1963,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22120501101016998,
|
|
"step": 1290,
|
|
"valid_targets_mean": 3698.2,
|
|
"valid_targets_min": 549
|
|
},
|
|
{
|
|
"epoch": 2.007751937984496,
|
|
"grad_norm": 0.3930458616713528,
|
|
"learning_rate": 3.590894377107629e-05,
|
|
"loss": 0.186,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2099405825138092,
|
|
"step": 1295,
|
|
"valid_targets_mean": 5265.2,
|
|
"valid_targets_min": 528
|
|
},
|
|
{
|
|
"epoch": 2.0155038759689923,
|
|
"grad_norm": 0.3382222565954035,
|
|
"learning_rate": 3.586196609408841e-05,
|
|
"loss": 0.1884,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16293954849243164,
|
|
"step": 1300,
|
|
"valid_targets_mean": 5672.2,
|
|
"valid_targets_min": 2311
|
|
},
|
|
{
|
|
"epoch": 2.0232558139534884,
|
|
"grad_norm": 0.4908644970549336,
|
|
"learning_rate": 3.5814751332915025e-05,
|
|
"loss": 0.2064,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22366786003112793,
|
|
"step": 1305,
|
|
"valid_targets_mean": 3243.5,
|
|
"valid_targets_min": 628
|
|
},
|
|
{
|
|
"epoch": 2.0310077519379846,
|
|
"grad_norm": 0.3498811091866486,
|
|
"learning_rate": 3.576730019326144e-05,
|
|
"loss": 0.1841,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15233008563518524,
|
|
"step": 1310,
|
|
"valid_targets_mean": 4671.6,
|
|
"valid_targets_min": 529
|
|
},
|
|
{
|
|
"epoch": 2.0387596899224807,
|
|
"grad_norm": 0.413386188431943,
|
|
"learning_rate": 3.571961338436599e-05,
|
|
"loss": 0.1917,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18065381050109863,
|
|
"step": 1315,
|
|
"valid_targets_mean": 5047.1,
|
|
"valid_targets_min": 845
|
|
},
|
|
{
|
|
"epoch": 2.046511627906977,
|
|
"grad_norm": 0.37597109516074934,
|
|
"learning_rate": 3.567169161898954e-05,
|
|
"loss": 0.1994,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1616477519273758,
|
|
"step": 1320,
|
|
"valid_targets_mean": 4590.8,
|
|
"valid_targets_min": 941
|
|
},
|
|
{
|
|
"epoch": 2.054263565891473,
|
|
"grad_norm": 0.41487589705713607,
|
|
"learning_rate": 3.562353561340473e-05,
|
|
"loss": 0.2004,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1990424543619156,
|
|
"step": 1325,
|
|
"valid_targets_mean": 5129.2,
|
|
"valid_targets_min": 2305
|
|
},
|
|
{
|
|
"epoch": 2.062015503875969,
|
|
"grad_norm": 0.3711795564505497,
|
|
"learning_rate": 3.557514608738536e-05,
|
|
"loss": 0.18,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15171518921852112,
|
|
"step": 1330,
|
|
"valid_targets_mean": 4377.2,
|
|
"valid_targets_min": 575
|
|
},
|
|
{
|
|
"epoch": 2.0697674418604652,
|
|
"grad_norm": 0.4175667094746574,
|
|
"learning_rate": 3.552652376419557e-05,
|
|
"loss": 0.1822,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16562065482139587,
|
|
"step": 1335,
|
|
"valid_targets_mean": 4697.5,
|
|
"valid_targets_min": 286
|
|
},
|
|
{
|
|
"epoch": 2.0775193798449614,
|
|
"grad_norm": 0.4306958245785991,
|
|
"learning_rate": 3.5477669370579045e-05,
|
|
"loss": 0.2022,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1900160312652588,
|
|
"step": 1340,
|
|
"valid_targets_mean": 4857.3,
|
|
"valid_targets_min": 1846
|
|
},
|
|
{
|
|
"epoch": 2.0852713178294575,
|
|
"grad_norm": 0.4476150200629465,
|
|
"learning_rate": 3.542858363674819e-05,
|
|
"loss": 0.1807,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18552112579345703,
|
|
"step": 1345,
|
|
"valid_targets_mean": 6009.1,
|
|
"valid_targets_min": 314
|
|
},
|
|
{
|
|
"epoch": 2.0930232558139537,
|
|
"grad_norm": 1.2948036152332547,
|
|
"learning_rate": 3.537926729637316e-05,
|
|
"loss": 0.1985,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19947974383831024,
|
|
"step": 1350,
|
|
"valid_targets_mean": 5068.8,
|
|
"valid_targets_min": 2881
|
|
},
|
|
{
|
|
"epoch": 2.10077519379845,
|
|
"grad_norm": 0.41477365418280177,
|
|
"learning_rate": 3.532972108657093e-05,
|
|
"loss": 0.1777,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19240254163742065,
|
|
"step": 1355,
|
|
"valid_targets_mean": 4253.2,
|
|
"valid_targets_min": 434
|
|
},
|
|
{
|
|
"epoch": 2.108527131782946,
|
|
"grad_norm": 0.42076615883749335,
|
|
"learning_rate": 3.527994574789425e-05,
|
|
"loss": 0.1741,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1795780062675476,
|
|
"step": 1360,
|
|
"valid_targets_mean": 4628.8,
|
|
"valid_targets_min": 677
|
|
},
|
|
{
|
|
"epoch": 2.116279069767442,
|
|
"grad_norm": 0.3617903288384957,
|
|
"learning_rate": 3.5229942024320614e-05,
|
|
"loss": 0.1858,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1568509340286255,
|
|
"step": 1365,
|
|
"valid_targets_mean": 4954.9,
|
|
"valid_targets_min": 712
|
|
},
|
|
{
|
|
"epoch": 2.124031007751938,
|
|
"grad_norm": 0.5456999997368401,
|
|
"learning_rate": 3.517971066324111e-05,
|
|
"loss": 0.1914,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17306216061115265,
|
|
"step": 1370,
|
|
"valid_targets_mean": 3624.9,
|
|
"valid_targets_min": 335
|
|
},
|
|
{
|
|
"epoch": 2.1317829457364343,
|
|
"grad_norm": 0.38334555353165817,
|
|
"learning_rate": 3.512925241544925e-05,
|
|
"loss": 0.1877,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19654911756515503,
|
|
"step": 1375,
|
|
"valid_targets_mean": 5664.1,
|
|
"valid_targets_min": 1799
|
|
},
|
|
{
|
|
"epoch": 2.13953488372093,
|
|
"grad_norm": 0.43336348909756756,
|
|
"learning_rate": 3.5078568035129755e-05,
|
|
"loss": 0.1835,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2114173173904419,
|
|
"step": 1380,
|
|
"valid_targets_mean": 4490.0,
|
|
"valid_targets_min": 535
|
|
},
|
|
{
|
|
"epoch": 2.147286821705426,
|
|
"grad_norm": 0.43851230664405455,
|
|
"learning_rate": 3.502765827984731e-05,
|
|
"loss": 0.1816,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2103298455476761,
|
|
"step": 1385,
|
|
"valid_targets_mean": 4057.0,
|
|
"valid_targets_min": 2866
|
|
},
|
|
{
|
|
"epoch": 2.1550387596899223,
|
|
"grad_norm": 0.48397504627229887,
|
|
"learning_rate": 3.497652391053517e-05,
|
|
"loss": 0.186,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2291339933872223,
|
|
"step": 1390,
|
|
"valid_targets_mean": 4031.1,
|
|
"valid_targets_min": 630
|
|
},
|
|
{
|
|
"epoch": 2.1627906976744184,
|
|
"grad_norm": 0.4549549638224178,
|
|
"learning_rate": 3.492516569148388e-05,
|
|
"loss": 0.2142,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21782903373241425,
|
|
"step": 1395,
|
|
"valid_targets_mean": 4231.4,
|
|
"valid_targets_min": 2014
|
|
},
|
|
{
|
|
"epoch": 2.1705426356589146,
|
|
"grad_norm": 0.36020932761428015,
|
|
"learning_rate": 3.487358439032975e-05,
|
|
"loss": 0.1616,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18451038002967834,
|
|
"step": 1400,
|
|
"valid_targets_mean": 6068.2,
|
|
"valid_targets_min": 2874
|
|
},
|
|
{
|
|
"epoch": 2.1782945736434107,
|
|
"grad_norm": 0.3920924834443207,
|
|
"learning_rate": 3.4821780778043474e-05,
|
|
"loss": 0.1889,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1814422309398651,
|
|
"step": 1405,
|
|
"valid_targets_mean": 4700.9,
|
|
"valid_targets_min": 656
|
|
},
|
|
{
|
|
"epoch": 2.186046511627907,
|
|
"grad_norm": 0.3750763170625423,
|
|
"learning_rate": 3.4769755628918545e-05,
|
|
"loss": 0.1779,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1634986400604248,
|
|
"step": 1410,
|
|
"valid_targets_mean": 4980.3,
|
|
"valid_targets_min": 2167
|
|
},
|
|
{
|
|
"epoch": 2.193798449612403,
|
|
"grad_norm": 0.42291953615168815,
|
|
"learning_rate": 3.471750972055972e-05,
|
|
"loss": 0.1733,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16338089108467102,
|
|
"step": 1415,
|
|
"valid_targets_mean": 4139.0,
|
|
"valid_targets_min": 391
|
|
},
|
|
{
|
|
"epoch": 2.201550387596899,
|
|
"grad_norm": 0.4171884044672125,
|
|
"learning_rate": 3.466504383387135e-05,
|
|
"loss": 0.172,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1964506208896637,
|
|
"step": 1420,
|
|
"valid_targets_mean": 4754.2,
|
|
"valid_targets_min": 2815
|
|
},
|
|
{
|
|
"epoch": 2.2093023255813953,
|
|
"grad_norm": 0.3903545245483966,
|
|
"learning_rate": 3.461235875304577e-05,
|
|
"loss": 0.1848,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20105893909931183,
|
|
"step": 1425,
|
|
"valid_targets_mean": 4361.9,
|
|
"valid_targets_min": 250
|
|
},
|
|
{
|
|
"epoch": 2.2170542635658914,
|
|
"grad_norm": 0.3750810698508955,
|
|
"learning_rate": 3.455945526555153e-05,
|
|
"loss": 0.1867,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17983251810073853,
|
|
"step": 1430,
|
|
"valid_targets_mean": 5131.6,
|
|
"valid_targets_min": 2493
|
|
},
|
|
{
|
|
"epoch": 2.2248062015503876,
|
|
"grad_norm": 0.37223290231346184,
|
|
"learning_rate": 3.450633416212162e-05,
|
|
"loss": 0.1922,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16431176662445068,
|
|
"step": 1435,
|
|
"valid_targets_mean": 4377.4,
|
|
"valid_targets_min": 613
|
|
},
|
|
{
|
|
"epoch": 2.2325581395348837,
|
|
"grad_norm": 0.3352051342701091,
|
|
"learning_rate": 3.4452996236741744e-05,
|
|
"loss": 0.1976,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1869511604309082,
|
|
"step": 1440,
|
|
"valid_targets_mean": 5356.9,
|
|
"valid_targets_min": 2703
|
|
},
|
|
{
|
|
"epoch": 2.24031007751938,
|
|
"grad_norm": 0.432086006561443,
|
|
"learning_rate": 3.439944228663829e-05,
|
|
"loss": 0.2079,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21285605430603027,
|
|
"step": 1445,
|
|
"valid_targets_mean": 4237.8,
|
|
"valid_targets_min": 1886
|
|
},
|
|
{
|
|
"epoch": 2.248062015503876,
|
|
"grad_norm": 0.3275443973114785,
|
|
"learning_rate": 3.434567311226656e-05,
|
|
"loss": 0.1757,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15418857336044312,
|
|
"step": 1450,
|
|
"valid_targets_mean": 5285.2,
|
|
"valid_targets_min": 566
|
|
},
|
|
{
|
|
"epoch": 2.255813953488372,
|
|
"grad_norm": 0.3576878996712879,
|
|
"learning_rate": 3.4291689517298734e-05,
|
|
"loss": 0.1946,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.186420738697052,
|
|
"step": 1455,
|
|
"valid_targets_mean": 5496.6,
|
|
"valid_targets_min": 321
|
|
},
|
|
{
|
|
"epoch": 2.2635658914728682,
|
|
"grad_norm": 0.4962339025365947,
|
|
"learning_rate": 3.423749230861188e-05,
|
|
"loss": 0.1694,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17092068493366241,
|
|
"step": 1460,
|
|
"valid_targets_mean": 3222.7,
|
|
"valid_targets_min": 402
|
|
},
|
|
{
|
|
"epoch": 2.2713178294573644,
|
|
"grad_norm": 0.4812137783785399,
|
|
"learning_rate": 3.418308229627588e-05,
|
|
"loss": 0.2163,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.27093812823295593,
|
|
"step": 1465,
|
|
"valid_targets_mean": 4862.1,
|
|
"valid_targets_min": 556
|
|
},
|
|
{
|
|
"epoch": 2.2790697674418605,
|
|
"grad_norm": 0.4153567019223971,
|
|
"learning_rate": 3.412846029354134e-05,
|
|
"loss": 0.1927,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.237184539437294,
|
|
"step": 1470,
|
|
"valid_targets_mean": 4620.6,
|
|
"valid_targets_min": 455
|
|
},
|
|
{
|
|
"epoch": 2.2868217054263567,
|
|
"grad_norm": 0.3426626225579909,
|
|
"learning_rate": 3.4073627116827425e-05,
|
|
"loss": 0.1781,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18062137067317963,
|
|
"step": 1475,
|
|
"valid_targets_mean": 5811.9,
|
|
"valid_targets_min": 2245
|
|
},
|
|
{
|
|
"epoch": 2.294573643410853,
|
|
"grad_norm": 0.38476093721663684,
|
|
"learning_rate": 3.4018583585709636e-05,
|
|
"loss": 0.1816,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18126948177814484,
|
|
"step": 1480,
|
|
"valid_targets_mean": 4559.2,
|
|
"valid_targets_min": 322
|
|
},
|
|
{
|
|
"epoch": 2.302325581395349,
|
|
"grad_norm": 0.4096766811442832,
|
|
"learning_rate": 3.39633305229076e-05,
|
|
"loss": 0.1877,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20921531319618225,
|
|
"step": 1485,
|
|
"valid_targets_mean": 5167.4,
|
|
"valid_targets_min": 684
|
|
},
|
|
{
|
|
"epoch": 2.310077519379845,
|
|
"grad_norm": 0.38639646068488026,
|
|
"learning_rate": 3.390786875427275e-05,
|
|
"loss": 0.1811,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15107879042625427,
|
|
"step": 1490,
|
|
"valid_targets_mean": 4523.8,
|
|
"valid_targets_min": 1865
|
|
},
|
|
{
|
|
"epoch": 2.317829457364341,
|
|
"grad_norm": 0.4502008909642411,
|
|
"learning_rate": 3.385219910877599e-05,
|
|
"loss": 0.2037,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1977536380290985,
|
|
"step": 1495,
|
|
"valid_targets_mean": 4173.2,
|
|
"valid_targets_min": 1948
|
|
},
|
|
{
|
|
"epoch": 2.3255813953488373,
|
|
"grad_norm": 0.3796879053543267,
|
|
"learning_rate": 3.3796322418495276e-05,
|
|
"loss": 0.1879,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1648637056350708,
|
|
"step": 1500,
|
|
"valid_targets_mean": 4416.7,
|
|
"valid_targets_min": 304
|
|
},
|
|
{
|
|
"epoch": 2.3333333333333335,
|
|
"grad_norm": 0.3789163353016251,
|
|
"learning_rate": 3.374023951860322e-05,
|
|
"loss": 0.1794,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1563669592142105,
|
|
"step": 1505,
|
|
"valid_targets_mean": 5124.2,
|
|
"valid_targets_min": 2981
|
|
},
|
|
{
|
|
"epoch": 2.3410852713178296,
|
|
"grad_norm": 0.41364685765156334,
|
|
"learning_rate": 3.368395124735459e-05,
|
|
"loss": 0.1893,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16633863747119904,
|
|
"step": 1510,
|
|
"valid_targets_mean": 3882.1,
|
|
"valid_targets_min": 282
|
|
},
|
|
{
|
|
"epoch": 2.3488372093023258,
|
|
"grad_norm": 0.35667587906507076,
|
|
"learning_rate": 3.3627458446073775e-05,
|
|
"loss": 0.1673,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13330259919166565,
|
|
"step": 1515,
|
|
"valid_targets_mean": 5481.6,
|
|
"valid_targets_min": 752
|
|
},
|
|
{
|
|
"epoch": 2.356589147286822,
|
|
"grad_norm": 0.3881816160616292,
|
|
"learning_rate": 3.357076195914221e-05,
|
|
"loss": 0.1789,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18566307425498962,
|
|
"step": 1520,
|
|
"valid_targets_mean": 5012.3,
|
|
"valid_targets_min": 1855
|
|
},
|
|
{
|
|
"epoch": 2.3643410852713176,
|
|
"grad_norm": 0.4712604845214267,
|
|
"learning_rate": 3.351386263398578e-05,
|
|
"loss": 0.1833,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19617591798305511,
|
|
"step": 1525,
|
|
"valid_targets_mean": 4073.4,
|
|
"valid_targets_min": 477
|
|
},
|
|
{
|
|
"epoch": 2.3720930232558137,
|
|
"grad_norm": 0.35048104567381255,
|
|
"learning_rate": 3.34567613210621e-05,
|
|
"loss": 0.1856,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17707285284996033,
|
|
"step": 1530,
|
|
"valid_targets_mean": 5311.7,
|
|
"valid_targets_min": 968
|
|
},
|
|
{
|
|
"epoch": 2.37984496124031,
|
|
"grad_norm": 0.41501213355240485,
|
|
"learning_rate": 3.3399458873847865e-05,
|
|
"loss": 0.1839,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18096289038658142,
|
|
"step": 1535,
|
|
"valid_targets_mean": 4257.4,
|
|
"valid_targets_min": 2687
|
|
},
|
|
{
|
|
"epoch": 2.387596899224806,
|
|
"grad_norm": 0.3935199588486319,
|
|
"learning_rate": 3.334195614882606e-05,
|
|
"loss": 0.2009,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23064912855625153,
|
|
"step": 1540,
|
|
"valid_targets_mean": 5280.2,
|
|
"valid_targets_min": 726
|
|
},
|
|
{
|
|
"epoch": 2.395348837209302,
|
|
"grad_norm": 0.39245757715509993,
|
|
"learning_rate": 3.3284254005473164e-05,
|
|
"loss": 0.1729,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14799197018146515,
|
|
"step": 1545,
|
|
"valid_targets_mean": 4357.3,
|
|
"valid_targets_min": 365
|
|
},
|
|
{
|
|
"epoch": 2.4031007751937983,
|
|
"grad_norm": 0.3960910530726775,
|
|
"learning_rate": 3.3226353306246296e-05,
|
|
"loss": 0.1802,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16391268372535706,
|
|
"step": 1550,
|
|
"valid_targets_mean": 4675.7,
|
|
"valid_targets_min": 472
|
|
},
|
|
{
|
|
"epoch": 2.4108527131782944,
|
|
"grad_norm": 0.399983594538759,
|
|
"learning_rate": 3.316825491657033e-05,
|
|
"loss": 0.1814,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18162378668785095,
|
|
"step": 1555,
|
|
"valid_targets_mean": 4586.7,
|
|
"valid_targets_min": 336
|
|
},
|
|
{
|
|
"epoch": 2.4186046511627906,
|
|
"grad_norm": 0.4339613073850326,
|
|
"learning_rate": 3.310995970482498e-05,
|
|
"loss": 0.1812,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18091610074043274,
|
|
"step": 1560,
|
|
"valid_targets_mean": 4878.5,
|
|
"valid_targets_min": 1433
|
|
},
|
|
{
|
|
"epoch": 2.4263565891472867,
|
|
"grad_norm": 0.40487359759812325,
|
|
"learning_rate": 3.3051468542331784e-05,
|
|
"loss": 0.1959,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17559471726417542,
|
|
"step": 1565,
|
|
"valid_targets_mean": 4204.3,
|
|
"valid_targets_min": 1999
|
|
},
|
|
{
|
|
"epoch": 2.434108527131783,
|
|
"grad_norm": 0.37204854898669026,
|
|
"learning_rate": 3.2992782303341104e-05,
|
|
"loss": 0.1642,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1342979371547699,
|
|
"step": 1570,
|
|
"valid_targets_mean": 4676.9,
|
|
"valid_targets_min": 720
|
|
},
|
|
{
|
|
"epoch": 2.441860465116279,
|
|
"grad_norm": 0.43162119589856907,
|
|
"learning_rate": 3.2933901865019064e-05,
|
|
"loss": 0.203,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2307354062795639,
|
|
"step": 1575,
|
|
"valid_targets_mean": 4931.0,
|
|
"valid_targets_min": 1914
|
|
},
|
|
{
|
|
"epoch": 2.449612403100775,
|
|
"grad_norm": 0.4576769904055123,
|
|
"learning_rate": 3.28748281074344e-05,
|
|
"loss": 0.1707,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15882378816604614,
|
|
"step": 1580,
|
|
"valid_targets_mean": 3951.5,
|
|
"valid_targets_min": 1846
|
|
},
|
|
{
|
|
"epoch": 2.4573643410852712,
|
|
"grad_norm": 0.4015392257462172,
|
|
"learning_rate": 3.281556191354538e-05,
|
|
"loss": 0.1666,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15286649763584137,
|
|
"step": 1585,
|
|
"valid_targets_mean": 5152.0,
|
|
"valid_targets_min": 285
|
|
},
|
|
{
|
|
"epoch": 2.4651162790697674,
|
|
"grad_norm": 0.42917005882818327,
|
|
"learning_rate": 3.2756104169186524e-05,
|
|
"loss": 0.1729,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17661848664283752,
|
|
"step": 1590,
|
|
"valid_targets_mean": 4086.8,
|
|
"valid_targets_min": 568
|
|
},
|
|
{
|
|
"epoch": 2.4728682170542635,
|
|
"grad_norm": 0.4411320746574963,
|
|
"learning_rate": 3.269645576305541e-05,
|
|
"loss": 0.1927,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.184126615524292,
|
|
"step": 1595,
|
|
"valid_targets_mean": 6700.9,
|
|
"valid_targets_min": 2494
|
|
},
|
|
{
|
|
"epoch": 2.4806201550387597,
|
|
"grad_norm": 0.4047963399547679,
|
|
"learning_rate": 3.2636617586699375e-05,
|
|
"loss": 0.1773,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16849125921726227,
|
|
"step": 1600,
|
|
"valid_targets_mean": 4574.2,
|
|
"valid_targets_min": 600
|
|
},
|
|
{
|
|
"epoch": 2.488372093023256,
|
|
"grad_norm": 0.44245747159170795,
|
|
"learning_rate": 3.257659053450223e-05,
|
|
"loss": 0.188,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20396322011947632,
|
|
"step": 1605,
|
|
"valid_targets_mean": 4482.4,
|
|
"valid_targets_min": 380
|
|
},
|
|
{
|
|
"epoch": 2.496124031007752,
|
|
"grad_norm": 0.43654194588770506,
|
|
"learning_rate": 3.251637550367082e-05,
|
|
"loss": 0.1768,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19797450304031372,
|
|
"step": 1610,
|
|
"valid_targets_mean": 4816.7,
|
|
"valid_targets_min": 2959
|
|
},
|
|
{
|
|
"epoch": 2.503875968992248,
|
|
"grad_norm": 0.43464122667550903,
|
|
"learning_rate": 3.245597339422165e-05,
|
|
"loss": 0.1815,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1967172473669052,
|
|
"step": 1615,
|
|
"valid_targets_mean": 5667.7,
|
|
"valid_targets_min": 559
|
|
},
|
|
{
|
|
"epoch": 2.511627906976744,
|
|
"grad_norm": 0.4652650203493568,
|
|
"learning_rate": 3.2395385108967486e-05,
|
|
"loss": 0.1801,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19761139154434204,
|
|
"step": 1620,
|
|
"valid_targets_mean": 4328.9,
|
|
"valid_targets_min": 314
|
|
},
|
|
{
|
|
"epoch": 2.5193798449612403,
|
|
"grad_norm": 0.40709753507837126,
|
|
"learning_rate": 3.233461155350375e-05,
|
|
"loss": 0.1843,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20508559048175812,
|
|
"step": 1625,
|
|
"valid_targets_mean": 5249.1,
|
|
"valid_targets_min": 216
|
|
},
|
|
{
|
|
"epoch": 2.5271317829457365,
|
|
"grad_norm": 0.4491598648675841,
|
|
"learning_rate": 3.227365363619507e-05,
|
|
"loss": 0.1918,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1938488781452179,
|
|
"step": 1630,
|
|
"valid_targets_mean": 3739.8,
|
|
"valid_targets_min": 2192
|
|
},
|
|
{
|
|
"epoch": 2.5348837209302326,
|
|
"grad_norm": 0.4742827982147315,
|
|
"learning_rate": 3.221251226816168e-05,
|
|
"loss": 0.1906,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17324459552764893,
|
|
"step": 1635,
|
|
"valid_targets_mean": 3619.9,
|
|
"valid_targets_min": 325
|
|
},
|
|
{
|
|
"epoch": 2.5426356589147288,
|
|
"grad_norm": 0.40634153675562273,
|
|
"learning_rate": 3.21511883632658e-05,
|
|
"loss": 0.1762,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17292270064353943,
|
|
"step": 1640,
|
|
"valid_targets_mean": 4721.2,
|
|
"valid_targets_min": 1866
|
|
},
|
|
{
|
|
"epoch": 2.550387596899225,
|
|
"grad_norm": 0.3502337789022322,
|
|
"learning_rate": 3.208968283809795e-05,
|
|
"loss": 0.1679,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13709160685539246,
|
|
"step": 1645,
|
|
"valid_targets_mean": 5043.9,
|
|
"valid_targets_min": 1925
|
|
},
|
|
{
|
|
"epoch": 2.558139534883721,
|
|
"grad_norm": 0.46216095941040614,
|
|
"learning_rate": 3.202799661196331e-05,
|
|
"loss": 0.1881,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22641834616661072,
|
|
"step": 1650,
|
|
"valid_targets_mean": 4146.6,
|
|
"valid_targets_min": 419
|
|
},
|
|
{
|
|
"epoch": 2.565891472868217,
|
|
"grad_norm": 0.3770036373887086,
|
|
"learning_rate": 3.196613060686791e-05,
|
|
"loss": 0.2024,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19278298318386078,
|
|
"step": 1655,
|
|
"valid_targets_mean": 5648.9,
|
|
"valid_targets_min": 1948
|
|
},
|
|
{
|
|
"epoch": 2.5736434108527133,
|
|
"grad_norm": 0.3885989041243395,
|
|
"learning_rate": 3.1904085747504927e-05,
|
|
"loss": 0.179,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17080789804458618,
|
|
"step": 1660,
|
|
"valid_targets_mean": 4642.9,
|
|
"valid_targets_min": 357
|
|
},
|
|
{
|
|
"epoch": 2.5813953488372094,
|
|
"grad_norm": 0.4011197982513075,
|
|
"learning_rate": 3.184186296124077e-05,
|
|
"loss": 0.1885,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1865064799785614,
|
|
"step": 1665,
|
|
"valid_targets_mean": 5166.7,
|
|
"valid_targets_min": 330
|
|
},
|
|
{
|
|
"epoch": 2.5891472868217056,
|
|
"grad_norm": 0.3745953386421688,
|
|
"learning_rate": 3.1779463178101317e-05,
|
|
"loss": 0.1844,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17259354889392853,
|
|
"step": 1670,
|
|
"valid_targets_mean": 4452.9,
|
|
"valid_targets_min": 2554
|
|
},
|
|
{
|
|
"epoch": 2.5968992248062017,
|
|
"grad_norm": 0.4235759003308612,
|
|
"learning_rate": 3.1716887330757935e-05,
|
|
"loss": 0.1797,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17030495405197144,
|
|
"step": 1675,
|
|
"valid_targets_mean": 4332.0,
|
|
"valid_targets_min": 2478
|
|
},
|
|
{
|
|
"epoch": 2.604651162790698,
|
|
"grad_norm": 0.4854637458573741,
|
|
"learning_rate": 3.165413635451358e-05,
|
|
"loss": 0.1711,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19602999091148376,
|
|
"step": 1680,
|
|
"valid_targets_mean": 3863.3,
|
|
"valid_targets_min": 355
|
|
},
|
|
{
|
|
"epoch": 2.612403100775194,
|
|
"grad_norm": 0.40699113598693853,
|
|
"learning_rate": 3.159121118728882e-05,
|
|
"loss": 0.1901,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18548724055290222,
|
|
"step": 1685,
|
|
"valid_targets_mean": 4666.2,
|
|
"valid_targets_min": 1840
|
|
},
|
|
{
|
|
"epoch": 2.62015503875969,
|
|
"grad_norm": 0.34544920663620954,
|
|
"learning_rate": 3.152811276960778e-05,
|
|
"loss": 0.1751,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14782579243183136,
|
|
"step": 1690,
|
|
"valid_targets_mean": 5451.3,
|
|
"valid_targets_min": 285
|
|
},
|
|
{
|
|
"epoch": 2.6279069767441863,
|
|
"grad_norm": 0.3927708940246696,
|
|
"learning_rate": 3.1464842044584134e-05,
|
|
"loss": 0.1937,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15799960494041443,
|
|
"step": 1695,
|
|
"valid_targets_mean": 5175.1,
|
|
"valid_targets_min": 719
|
|
},
|
|
{
|
|
"epoch": 2.6356589147286824,
|
|
"grad_norm": 0.40704479344798744,
|
|
"learning_rate": 3.140139995790697e-05,
|
|
"loss": 0.1888,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21562063694000244,
|
|
"step": 1700,
|
|
"valid_targets_mean": 4840.2,
|
|
"valid_targets_min": 330
|
|
},
|
|
{
|
|
"epoch": 2.6434108527131785,
|
|
"grad_norm": 0.4492192562060312,
|
|
"learning_rate": 3.1337787457826676e-05,
|
|
"loss": 0.2064,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20294302701950073,
|
|
"step": 1705,
|
|
"valid_targets_mean": 4130.9,
|
|
"valid_targets_min": 836
|
|
},
|
|
{
|
|
"epoch": 2.6511627906976747,
|
|
"grad_norm": 0.439737875037387,
|
|
"learning_rate": 3.127400549514075e-05,
|
|
"loss": 0.1844,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22795331478118896,
|
|
"step": 1710,
|
|
"valid_targets_mean": 4858.8,
|
|
"valid_targets_min": 566
|
|
},
|
|
{
|
|
"epoch": 2.6589147286821704,
|
|
"grad_norm": 0.3937483563358435,
|
|
"learning_rate": 3.121005502317961e-05,
|
|
"loss": 0.1773,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14470066130161285,
|
|
"step": 1715,
|
|
"valid_targets_mean": 4338.8,
|
|
"valid_targets_min": 808
|
|
},
|
|
{
|
|
"epoch": 2.6666666666666665,
|
|
"grad_norm": 0.43258662767772366,
|
|
"learning_rate": 3.114593699779233e-05,
|
|
"loss": 0.1793,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18938937783241272,
|
|
"step": 1720,
|
|
"valid_targets_mean": 4000.3,
|
|
"valid_targets_min": 2352
|
|
},
|
|
{
|
|
"epoch": 2.6744186046511627,
|
|
"grad_norm": 0.38825080259416433,
|
|
"learning_rate": 3.108165237733235e-05,
|
|
"loss": 0.1896,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20304493606090546,
|
|
"step": 1725,
|
|
"valid_targets_mean": 5271.6,
|
|
"valid_targets_min": 2162
|
|
},
|
|
{
|
|
"epoch": 2.682170542635659,
|
|
"grad_norm": 0.5030719627542097,
|
|
"learning_rate": 3.101720212264315e-05,
|
|
"loss": 0.1836,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1815469115972519,
|
|
"step": 1730,
|
|
"valid_targets_mean": 3065.4,
|
|
"valid_targets_min": 304
|
|
},
|
|
{
|
|
"epoch": 2.689922480620155,
|
|
"grad_norm": 0.48074649750101905,
|
|
"learning_rate": 3.0952587197043916e-05,
|
|
"loss": 0.1565,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1928318440914154,
|
|
"step": 1735,
|
|
"valid_targets_mean": 3592.6,
|
|
"valid_targets_min": 639
|
|
},
|
|
{
|
|
"epoch": 2.697674418604651,
|
|
"grad_norm": 0.38224384351415913,
|
|
"learning_rate": 3.0887808566315123e-05,
|
|
"loss": 0.1699,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16647925972938538,
|
|
"step": 1740,
|
|
"valid_targets_mean": 4713.6,
|
|
"valid_targets_min": 639
|
|
},
|
|
{
|
|
"epoch": 2.705426356589147,
|
|
"grad_norm": 0.33777469296551843,
|
|
"learning_rate": 3.0822867198684076e-05,
|
|
"loss": 0.1617,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15009137988090515,
|
|
"step": 1745,
|
|
"valid_targets_mean": 6850.4,
|
|
"valid_targets_min": 2445
|
|
},
|
|
{
|
|
"epoch": 2.7131782945736433,
|
|
"grad_norm": 0.44540770518271033,
|
|
"learning_rate": 3.075776406481048e-05,
|
|
"loss": 0.185,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18640130758285522,
|
|
"step": 1750,
|
|
"valid_targets_mean": 4726.7,
|
|
"valid_targets_min": 1933
|
|
},
|
|
{
|
|
"epoch": 2.7209302325581395,
|
|
"grad_norm": 0.44372094538107276,
|
|
"learning_rate": 3.0692500137771926e-05,
|
|
"loss": 0.183,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22654184699058533,
|
|
"step": 1755,
|
|
"valid_targets_mean": 3954.4,
|
|
"valid_targets_min": 606
|
|
},
|
|
{
|
|
"epoch": 2.7286821705426356,
|
|
"grad_norm": 0.369529532189345,
|
|
"learning_rate": 3.062707639304928e-05,
|
|
"loss": 0.1822,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17843511700630188,
|
|
"step": 1760,
|
|
"valid_targets_mean": 5725.1,
|
|
"valid_targets_min": 1885
|
|
},
|
|
{
|
|
"epoch": 2.7364341085271318,
|
|
"grad_norm": 0.40621309446299825,
|
|
"learning_rate": 3.0561493808512216e-05,
|
|
"loss": 0.1589,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21624553203582764,
|
|
"step": 1765,
|
|
"valid_targets_mean": 4932.4,
|
|
"valid_targets_min": 2437
|
|
},
|
|
{
|
|
"epoch": 2.744186046511628,
|
|
"grad_norm": 0.4324605534368406,
|
|
"learning_rate": 3.0495753364404513e-05,
|
|
"loss": 0.1693,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1789764165878296,
|
|
"step": 1770,
|
|
"valid_targets_mean": 4427.4,
|
|
"valid_targets_min": 1030
|
|
},
|
|
{
|
|
"epoch": 2.751937984496124,
|
|
"grad_norm": 0.44772637547939986,
|
|
"learning_rate": 3.042985604332943e-05,
|
|
"loss": 0.1807,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21675977110862732,
|
|
"step": 1775,
|
|
"valid_targets_mean": 4327.5,
|
|
"valid_targets_min": 783
|
|
},
|
|
{
|
|
"epoch": 2.75968992248062,
|
|
"grad_norm": 0.3320961105254609,
|
|
"learning_rate": 3.036380283023502e-05,
|
|
"loss": 0.1697,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15626108646392822,
|
|
"step": 1780,
|
|
"valid_targets_mean": 5396.8,
|
|
"valid_targets_min": 646
|
|
},
|
|
{
|
|
"epoch": 2.7674418604651163,
|
|
"grad_norm": 0.37789640533310415,
|
|
"learning_rate": 3.0297594712399428e-05,
|
|
"loss": 0.1933,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15670335292816162,
|
|
"step": 1785,
|
|
"valid_targets_mean": 4688.8,
|
|
"valid_targets_min": 527
|
|
},
|
|
{
|
|
"epoch": 2.7751937984496124,
|
|
"grad_norm": 0.40427238608967736,
|
|
"learning_rate": 3.0231232679416088e-05,
|
|
"loss": 0.1932,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2058807611465454,
|
|
"step": 1790,
|
|
"valid_targets_mean": 4991.1,
|
|
"valid_targets_min": 2320
|
|
},
|
|
{
|
|
"epoch": 2.7829457364341086,
|
|
"grad_norm": 0.3958864673220442,
|
|
"learning_rate": 3.0164717723178976e-05,
|
|
"loss": 0.1758,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1790355145931244,
|
|
"step": 1795,
|
|
"valid_targets_mean": 4758.6,
|
|
"valid_targets_min": 623
|
|
},
|
|
{
|
|
"epoch": 2.7906976744186047,
|
|
"grad_norm": 0.3482330544899987,
|
|
"learning_rate": 3.0098050837867755e-05,
|
|
"loss": 0.183,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15739408135414124,
|
|
"step": 1800,
|
|
"valid_targets_mean": 5299.1,
|
|
"valid_targets_min": 957
|
|
},
|
|
{
|
|
"epoch": 2.798449612403101,
|
|
"grad_norm": 0.41439611401362086,
|
|
"learning_rate": 3.003123301993295e-05,
|
|
"loss": 0.171,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16220103204250336,
|
|
"step": 1805,
|
|
"valid_targets_mean": 4676.3,
|
|
"valid_targets_min": 1825
|
|
},
|
|
{
|
|
"epoch": 2.806201550387597,
|
|
"grad_norm": 0.41973002932333475,
|
|
"learning_rate": 2.9964265268081e-05,
|
|
"loss": 0.1814,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15398794412612915,
|
|
"step": 1810,
|
|
"valid_targets_mean": 3951.7,
|
|
"valid_targets_min": 308
|
|
},
|
|
{
|
|
"epoch": 2.813953488372093,
|
|
"grad_norm": 0.41316632273979337,
|
|
"learning_rate": 2.9897148583259386e-05,
|
|
"loss": 0.1996,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21641714870929718,
|
|
"step": 1815,
|
|
"valid_targets_mean": 4523.2,
|
|
"valid_targets_min": 630
|
|
},
|
|
{
|
|
"epoch": 2.8217054263565893,
|
|
"grad_norm": 0.44522140399389565,
|
|
"learning_rate": 2.982988396864165e-05,
|
|
"loss": 0.1832,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18898218870162964,
|
|
"step": 1820,
|
|
"valid_targets_mean": 4400.8,
|
|
"valid_targets_min": 996
|
|
},
|
|
{
|
|
"epoch": 2.8294573643410854,
|
|
"grad_norm": 0.3738531998626034,
|
|
"learning_rate": 2.9762472429612375e-05,
|
|
"loss": 0.1813,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15361550450325012,
|
|
"step": 1825,
|
|
"valid_targets_mean": 4821.5,
|
|
"valid_targets_min": 978
|
|
},
|
|
{
|
|
"epoch": 2.8372093023255816,
|
|
"grad_norm": 0.43083740204233706,
|
|
"learning_rate": 2.9694914973752194e-05,
|
|
"loss": 0.1722,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1844104826450348,
|
|
"step": 1830,
|
|
"valid_targets_mean": 3693.3,
|
|
"valid_targets_min": 527
|
|
},
|
|
{
|
|
"epoch": 2.8449612403100772,
|
|
"grad_norm": 0.3659912670375286,
|
|
"learning_rate": 2.962721261082272e-05,
|
|
"loss": 0.1889,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20017662644386292,
|
|
"step": 1835,
|
|
"valid_targets_mean": 6980.4,
|
|
"valid_targets_min": 3136
|
|
},
|
|
{
|
|
"epoch": 2.8527131782945734,
|
|
"grad_norm": 0.4567000170536253,
|
|
"learning_rate": 2.9559366352751445e-05,
|
|
"loss": 0.1919,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23465114831924438,
|
|
"step": 1840,
|
|
"valid_targets_mean": 4588.8,
|
|
"valid_targets_min": 2486
|
|
},
|
|
{
|
|
"epoch": 2.8604651162790695,
|
|
"grad_norm": 0.40929029223114577,
|
|
"learning_rate": 2.9491377213616618e-05,
|
|
"loss": 0.1747,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18239933252334595,
|
|
"step": 1845,
|
|
"valid_targets_mean": 4133.6,
|
|
"valid_targets_min": 513
|
|
},
|
|
{
|
|
"epoch": 2.8682170542635657,
|
|
"grad_norm": 0.40525101121640406,
|
|
"learning_rate": 2.94232462096321e-05,
|
|
"loss": 0.1865,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1767432689666748,
|
|
"step": 1850,
|
|
"valid_targets_mean": 4216.1,
|
|
"valid_targets_min": 516
|
|
},
|
|
{
|
|
"epoch": 2.875968992248062,
|
|
"grad_norm": 0.4366325773783958,
|
|
"learning_rate": 2.9354974359132135e-05,
|
|
"loss": 0.1826,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19949214160442352,
|
|
"step": 1855,
|
|
"valid_targets_mean": 4033.6,
|
|
"valid_targets_min": 1922
|
|
},
|
|
{
|
|
"epoch": 2.883720930232558,
|
|
"grad_norm": 0.42935985240712937,
|
|
"learning_rate": 2.92865626825562e-05,
|
|
"loss": 0.1783,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18675842881202698,
|
|
"step": 1860,
|
|
"valid_targets_mean": 4010.4,
|
|
"valid_targets_min": 946
|
|
},
|
|
{
|
|
"epoch": 2.891472868217054,
|
|
"grad_norm": 0.31457168919286277,
|
|
"learning_rate": 2.921801220243368e-05,
|
|
"loss": 0.1585,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13208898901939392,
|
|
"step": 1865,
|
|
"valid_targets_mean": 6431.9,
|
|
"valid_targets_min": 2510
|
|
},
|
|
{
|
|
"epoch": 2.89922480620155,
|
|
"grad_norm": 0.39154537620319585,
|
|
"learning_rate": 2.9149323943368635e-05,
|
|
"loss": 0.1779,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15021896362304688,
|
|
"step": 1870,
|
|
"valid_targets_mean": 5320.4,
|
|
"valid_targets_min": 2104
|
|
},
|
|
{
|
|
"epoch": 2.9069767441860463,
|
|
"grad_norm": 0.4215081843896084,
|
|
"learning_rate": 2.9080498932024462e-05,
|
|
"loss": 0.1708,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19808581471443176,
|
|
"step": 1875,
|
|
"valid_targets_mean": 4261.8,
|
|
"valid_targets_min": 434
|
|
},
|
|
{
|
|
"epoch": 2.9147286821705425,
|
|
"grad_norm": 0.48180287200478444,
|
|
"learning_rate": 2.901153819710855e-05,
|
|
"loss": 0.1831,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20577339828014374,
|
|
"step": 1880,
|
|
"valid_targets_mean": 3915.2,
|
|
"valid_targets_min": 551
|
|
},
|
|
{
|
|
"epoch": 2.9224806201550386,
|
|
"grad_norm": 0.4046284897843421,
|
|
"learning_rate": 2.8942442769356896e-05,
|
|
"loss": 0.1648,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20008404552936554,
|
|
"step": 1885,
|
|
"valid_targets_mean": 5054.2,
|
|
"valid_targets_min": 2545
|
|
},
|
|
{
|
|
"epoch": 2.9302325581395348,
|
|
"grad_norm": 0.3202021785981192,
|
|
"learning_rate": 2.8873213681518747e-05,
|
|
"loss": 0.1676,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14765912294387817,
|
|
"step": 1890,
|
|
"valid_targets_mean": 5971.2,
|
|
"valid_targets_min": 1835
|
|
},
|
|
{
|
|
"epoch": 2.937984496124031,
|
|
"grad_norm": 0.3975741557425795,
|
|
"learning_rate": 2.8803851968341092e-05,
|
|
"loss": 0.1965,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17159457504749298,
|
|
"step": 1895,
|
|
"valid_targets_mean": 4565.2,
|
|
"valid_targets_min": 1942
|
|
},
|
|
{
|
|
"epoch": 2.945736434108527,
|
|
"grad_norm": 0.46251815005036806,
|
|
"learning_rate": 2.873435866655326e-05,
|
|
"loss": 0.1843,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24192339181900024,
|
|
"step": 1900,
|
|
"valid_targets_mean": 4237.6,
|
|
"valid_targets_min": 326
|
|
},
|
|
{
|
|
"epoch": 2.953488372093023,
|
|
"grad_norm": 0.41403119618696854,
|
|
"learning_rate": 2.8664734814851377e-05,
|
|
"loss": 0.1783,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18902885913848877,
|
|
"step": 1905,
|
|
"valid_targets_mean": 4557.3,
|
|
"valid_targets_min": 849
|
|
},
|
|
{
|
|
"epoch": 2.9612403100775193,
|
|
"grad_norm": 0.44851409111675167,
|
|
"learning_rate": 2.8594981453882874e-05,
|
|
"loss": 0.1656,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20263975858688354,
|
|
"step": 1910,
|
|
"valid_targets_mean": 3717.8,
|
|
"valid_targets_min": 926
|
|
},
|
|
{
|
|
"epoch": 2.9689922480620154,
|
|
"grad_norm": 0.42903678457431993,
|
|
"learning_rate": 2.85250996262309e-05,
|
|
"loss": 0.1957,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23578867316246033,
|
|
"step": 1915,
|
|
"valid_targets_mean": 4934.7,
|
|
"valid_targets_min": 685
|
|
},
|
|
{
|
|
"epoch": 2.9767441860465116,
|
|
"grad_norm": 0.7267563478310851,
|
|
"learning_rate": 2.8455090376398783e-05,
|
|
"loss": 0.1792,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18642187118530273,
|
|
"step": 1920,
|
|
"valid_targets_mean": 4939.8,
|
|
"valid_targets_min": 2461
|
|
},
|
|
{
|
|
"epoch": 2.9844961240310077,
|
|
"grad_norm": 0.45652911775394833,
|
|
"learning_rate": 2.8384954750794383e-05,
|
|
"loss": 0.1679,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1863420158624649,
|
|
"step": 1925,
|
|
"valid_targets_mean": 4101.9,
|
|
"valid_targets_min": 386
|
|
},
|
|
{
|
|
"epoch": 2.992248062015504,
|
|
"grad_norm": 0.4162197137776795,
|
|
"learning_rate": 2.8314693797714453e-05,
|
|
"loss": 0.1786,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16806048154830933,
|
|
"step": 1930,
|
|
"valid_targets_mean": 3889.9,
|
|
"valid_targets_min": 266
|
|
},
|
|
{
|
|
"epoch": 3.0,
|
|
"grad_norm": 0.4173426583399949,
|
|
"learning_rate": 2.8244308567328995e-05,
|
|
"loss": 0.1705,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1593976765871048,
|
|
"step": 1935,
|
|
"valid_targets_mean": 3841.9,
|
|
"valid_targets_min": 725
|
|
},
|
|
{
|
|
"epoch": 3.007751937984496,
|
|
"grad_norm": 0.31143453647713937,
|
|
"learning_rate": 2.8173800111665534e-05,
|
|
"loss": 0.1603,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1310623288154602,
|
|
"step": 1940,
|
|
"valid_targets_mean": 6594.8,
|
|
"valid_targets_min": 3125
|
|
},
|
|
{
|
|
"epoch": 3.0155038759689923,
|
|
"grad_norm": 0.37798360065942155,
|
|
"learning_rate": 2.8103169484593408e-05,
|
|
"loss": 0.1671,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14523474872112274,
|
|
"step": 1945,
|
|
"valid_targets_mean": 4545.6,
|
|
"valid_targets_min": 391
|
|
},
|
|
{
|
|
"epoch": 3.0232558139534884,
|
|
"grad_norm": 0.4193657818911918,
|
|
"learning_rate": 2.8032417741808026e-05,
|
|
"loss": 0.1825,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19101709127426147,
|
|
"step": 1950,
|
|
"valid_targets_mean": 4638.9,
|
|
"valid_targets_min": 1098
|
|
},
|
|
{
|
|
"epoch": 3.0310077519379846,
|
|
"grad_norm": 0.4292392293342452,
|
|
"learning_rate": 2.7961545940815073e-05,
|
|
"loss": 0.1683,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14101950824260712,
|
|
"step": 1955,
|
|
"valid_targets_mean": 4463.8,
|
|
"valid_targets_min": 734
|
|
},
|
|
{
|
|
"epoch": 3.0387596899224807,
|
|
"grad_norm": 0.445566159385126,
|
|
"learning_rate": 2.7890555140914712e-05,
|
|
"loss": 0.1761,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15082740783691406,
|
|
"step": 1960,
|
|
"valid_targets_mean": 4373.4,
|
|
"valid_targets_min": 196
|
|
},
|
|
{
|
|
"epoch": 3.046511627906977,
|
|
"grad_norm": 0.3879287131571122,
|
|
"learning_rate": 2.7819446403185737e-05,
|
|
"loss": 0.1633,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.155793234705925,
|
|
"step": 1965,
|
|
"valid_targets_mean": 4823.5,
|
|
"valid_targets_min": 424
|
|
},
|
|
{
|
|
"epoch": 3.054263565891473,
|
|
"grad_norm": 0.4580658977138339,
|
|
"learning_rate": 2.774822079046973e-05,
|
|
"loss": 0.1615,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1928856372833252,
|
|
"step": 1970,
|
|
"valid_targets_mean": 4411.8,
|
|
"valid_targets_min": 994
|
|
},
|
|
{
|
|
"epoch": 3.062015503875969,
|
|
"grad_norm": 0.37791164078529926,
|
|
"learning_rate": 2.7676879367355182e-05,
|
|
"loss": 0.1947,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22396092116832733,
|
|
"step": 1975,
|
|
"valid_targets_mean": 6053.8,
|
|
"valid_targets_min": 341
|
|
},
|
|
{
|
|
"epoch": 3.0697674418604652,
|
|
"grad_norm": 0.5813711025395043,
|
|
"learning_rate": 2.7605423200161544e-05,
|
|
"loss": 0.1766,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20629319548606873,
|
|
"step": 1980,
|
|
"valid_targets_mean": 2834.8,
|
|
"valid_targets_min": 594
|
|
},
|
|
{
|
|
"epoch": 3.0775193798449614,
|
|
"grad_norm": 0.5229150181707595,
|
|
"learning_rate": 2.753385335692334e-05,
|
|
"loss": 0.1801,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19532498717308044,
|
|
"step": 1985,
|
|
"valid_targets_mean": 5435.9,
|
|
"valid_targets_min": 2333
|
|
},
|
|
{
|
|
"epoch": 3.0852713178294575,
|
|
"grad_norm": 0.5039292916210872,
|
|
"learning_rate": 2.7462170907374152e-05,
|
|
"loss": 0.2046,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2393975555896759,
|
|
"step": 1990,
|
|
"valid_targets_mean": 3852.1,
|
|
"valid_targets_min": 621
|
|
},
|
|
{
|
|
"epoch": 3.0930232558139537,
|
|
"grad_norm": 0.4334986389248226,
|
|
"learning_rate": 2.7390376922930676e-05,
|
|
"loss": 0.1536,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2017873227596283,
|
|
"step": 1995,
|
|
"valid_targets_mean": 4789.2,
|
|
"valid_targets_min": 578
|
|
},
|
|
{
|
|
"epoch": 3.10077519379845,
|
|
"grad_norm": 0.48940426768725165,
|
|
"learning_rate": 2.7318472476676678e-05,
|
|
"loss": 0.1677,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20767296850681305,
|
|
"step": 2000,
|
|
"valid_targets_mean": 4572.1,
|
|
"valid_targets_min": 564
|
|
},
|
|
{
|
|
"epoch": 3.108527131782946,
|
|
"grad_norm": 0.45021483225829007,
|
|
"learning_rate": 2.7246458643346954e-05,
|
|
"loss": 0.1722,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19874969124794006,
|
|
"step": 2005,
|
|
"valid_targets_mean": 4382.3,
|
|
"valid_targets_min": 400
|
|
},
|
|
{
|
|
"epoch": 3.116279069767442,
|
|
"grad_norm": 0.39974386281581625,
|
|
"learning_rate": 2.7174336499311306e-05,
|
|
"loss": 0.1615,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15649522840976715,
|
|
"step": 2010,
|
|
"valid_targets_mean": 4884.1,
|
|
"valid_targets_min": 1197
|
|
},
|
|
{
|
|
"epoch": 3.124031007751938,
|
|
"grad_norm": 0.4810534052770901,
|
|
"learning_rate": 2.7102107122558388e-05,
|
|
"loss": 0.1697,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.196878120303154,
|
|
"step": 2015,
|
|
"valid_targets_mean": 4465.6,
|
|
"valid_targets_min": 422
|
|
},
|
|
{
|
|
"epoch": 3.1317829457364343,
|
|
"grad_norm": 0.4405420076380904,
|
|
"learning_rate": 2.7029771592679667e-05,
|
|
"loss": 0.1832,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2112666368484497,
|
|
"step": 2020,
|
|
"valid_targets_mean": 4233.7,
|
|
"valid_targets_min": 2211
|
|
},
|
|
{
|
|
"epoch": 3.13953488372093,
|
|
"grad_norm": 0.435544733463545,
|
|
"learning_rate": 2.695733099085322e-05,
|
|
"loss": 0.1738,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1643523871898651,
|
|
"step": 2025,
|
|
"valid_targets_mean": 4607.8,
|
|
"valid_targets_min": 313
|
|
},
|
|
{
|
|
"epoch": 3.147286821705426,
|
|
"grad_norm": 0.39286659071704916,
|
|
"learning_rate": 2.6884786399827617e-05,
|
|
"loss": 0.1654,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1477556824684143,
|
|
"step": 2030,
|
|
"valid_targets_mean": 4724.6,
|
|
"valid_targets_min": 1978
|
|
},
|
|
{
|
|
"epoch": 3.1550387596899223,
|
|
"grad_norm": 0.3724002460323432,
|
|
"learning_rate": 2.6812138903905725e-05,
|
|
"loss": 0.1646,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16990327835083008,
|
|
"step": 2035,
|
|
"valid_targets_mean": 4912.9,
|
|
"valid_targets_min": 2789
|
|
},
|
|
{
|
|
"epoch": 3.1627906976744184,
|
|
"grad_norm": 0.3944253467485725,
|
|
"learning_rate": 2.6739389588928496e-05,
|
|
"loss": 0.1538,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15294812619686127,
|
|
"step": 2040,
|
|
"valid_targets_mean": 4411.3,
|
|
"valid_targets_min": 470
|
|
},
|
|
{
|
|
"epoch": 3.1705426356589146,
|
|
"grad_norm": 0.4077204261905621,
|
|
"learning_rate": 2.6666539542258742e-05,
|
|
"loss": 0.1918,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2099585086107254,
|
|
"step": 2045,
|
|
"valid_targets_mean": 5898.4,
|
|
"valid_targets_min": 2703
|
|
},
|
|
{
|
|
"epoch": 3.1782945736434107,
|
|
"grad_norm": 0.3700464997656355,
|
|
"learning_rate": 2.6593589852764886e-05,
|
|
"loss": 0.1866,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17447850108146667,
|
|
"step": 2050,
|
|
"valid_targets_mean": 5101.3,
|
|
"valid_targets_min": 242
|
|
},
|
|
{
|
|
"epoch": 3.186046511627907,
|
|
"grad_norm": 0.4095360723042356,
|
|
"learning_rate": 2.6520541610804688e-05,
|
|
"loss": 0.1655,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18860718607902527,
|
|
"step": 2055,
|
|
"valid_targets_mean": 4771.2,
|
|
"valid_targets_min": 2471
|
|
},
|
|
{
|
|
"epoch": 3.193798449612403,
|
|
"grad_norm": 0.42170127535958324,
|
|
"learning_rate": 2.6447395908208933e-05,
|
|
"loss": 0.1719,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19056911766529083,
|
|
"step": 2060,
|
|
"valid_targets_mean": 4609.7,
|
|
"valid_targets_min": 487
|
|
},
|
|
{
|
|
"epoch": 3.201550387596899,
|
|
"grad_norm": 0.3731793258953492,
|
|
"learning_rate": 2.6374153838265117e-05,
|
|
"loss": 0.1551,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14581088721752167,
|
|
"step": 2065,
|
|
"valid_targets_mean": 4326.2,
|
|
"valid_targets_min": 282
|
|
},
|
|
{
|
|
"epoch": 3.2093023255813953,
|
|
"grad_norm": 0.39762533461899896,
|
|
"learning_rate": 2.6300816495701124e-05,
|
|
"loss": 0.1697,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15880948305130005,
|
|
"step": 2070,
|
|
"valid_targets_mean": 4789.0,
|
|
"valid_targets_min": 1925
|
|
},
|
|
{
|
|
"epoch": 3.2170542635658914,
|
|
"grad_norm": 0.44748063624921613,
|
|
"learning_rate": 2.6227384976668848e-05,
|
|
"loss": 0.1763,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.170176699757576,
|
|
"step": 2075,
|
|
"valid_targets_mean": 3995.2,
|
|
"valid_targets_min": 1668
|
|
},
|
|
{
|
|
"epoch": 3.2248062015503876,
|
|
"grad_norm": 0.36135621157101455,
|
|
"learning_rate": 2.6153860378727805e-05,
|
|
"loss": 0.1568,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1492878496646881,
|
|
"step": 2080,
|
|
"valid_targets_mean": 4992.2,
|
|
"valid_targets_min": 330
|
|
},
|
|
{
|
|
"epoch": 3.2325581395348837,
|
|
"grad_norm": 0.4154124841987222,
|
|
"learning_rate": 2.6080243800828742e-05,
|
|
"loss": 0.1655,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17003397643566132,
|
|
"step": 2085,
|
|
"valid_targets_mean": 4658.8,
|
|
"valid_targets_min": 1209
|
|
},
|
|
{
|
|
"epoch": 3.24031007751938,
|
|
"grad_norm": 0.37368780763861736,
|
|
"learning_rate": 2.600653634329719e-05,
|
|
"loss": 0.1793,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1633392572402954,
|
|
"step": 2090,
|
|
"valid_targets_mean": 4566.2,
|
|
"valid_targets_min": 2411
|
|
},
|
|
{
|
|
"epoch": 3.248062015503876,
|
|
"grad_norm": 0.3979676356096421,
|
|
"learning_rate": 2.593273910781705e-05,
|
|
"loss": 0.1634,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17785364389419556,
|
|
"step": 2095,
|
|
"valid_targets_mean": 4691.6,
|
|
"valid_targets_min": 432
|
|
},
|
|
{
|
|
"epoch": 3.255813953488372,
|
|
"grad_norm": 0.4225515784722321,
|
|
"learning_rate": 2.585885319741409e-05,
|
|
"loss": 0.1782,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18224605917930603,
|
|
"step": 2100,
|
|
"valid_targets_mean": 4253.3,
|
|
"valid_targets_min": 756
|
|
},
|
|
{
|
|
"epoch": 3.2635658914728682,
|
|
"grad_norm": 0.38016881244736056,
|
|
"learning_rate": 2.5784879716439495e-05,
|
|
"loss": 0.1527,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12859958410263062,
|
|
"step": 2105,
|
|
"valid_targets_mean": 3910.2,
|
|
"valid_targets_min": 549
|
|
},
|
|
{
|
|
"epoch": 3.2713178294573644,
|
|
"grad_norm": 0.5201402499872219,
|
|
"learning_rate": 2.5710819770553322e-05,
|
|
"loss": 0.1521,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15190503001213074,
|
|
"step": 2110,
|
|
"valid_targets_mean": 4282.5,
|
|
"valid_targets_min": 460
|
|
},
|
|
{
|
|
"epoch": 3.2790697674418605,
|
|
"grad_norm": 0.36744579209677214,
|
|
"learning_rate": 2.5636674466708002e-05,
|
|
"loss": 0.1595,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14565041661262512,
|
|
"step": 2115,
|
|
"valid_targets_mean": 4384.2,
|
|
"valid_targets_min": 328
|
|
},
|
|
{
|
|
"epoch": 3.2868217054263567,
|
|
"grad_norm": 0.41793705033807765,
|
|
"learning_rate": 2.5562444913131802e-05,
|
|
"loss": 0.1838,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16959373652935028,
|
|
"step": 2120,
|
|
"valid_targets_mean": 4006.3,
|
|
"valid_targets_min": 412
|
|
},
|
|
{
|
|
"epoch": 3.294573643410853,
|
|
"grad_norm": 0.4168288113393459,
|
|
"learning_rate": 2.548813221931221e-05,
|
|
"loss": 0.1637,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15278933942317963,
|
|
"step": 2125,
|
|
"valid_targets_mean": 4835.8,
|
|
"valid_targets_min": 1716
|
|
},
|
|
{
|
|
"epoch": 3.302325581395349,
|
|
"grad_norm": 0.43979678843894293,
|
|
"learning_rate": 2.5413737495979426e-05,
|
|
"loss": 0.1674,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16088305413722992,
|
|
"step": 2130,
|
|
"valid_targets_mean": 4291.2,
|
|
"valid_targets_min": 2104
|
|
},
|
|
{
|
|
"epoch": 3.310077519379845,
|
|
"grad_norm": 0.3934052531036587,
|
|
"learning_rate": 2.5339261855089694e-05,
|
|
"loss": 0.1657,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15298032760620117,
|
|
"step": 2135,
|
|
"valid_targets_mean": 4588.1,
|
|
"valid_targets_min": 329
|
|
},
|
|
{
|
|
"epoch": 3.317829457364341,
|
|
"grad_norm": 0.36169781906861537,
|
|
"learning_rate": 2.5264706409808725e-05,
|
|
"loss": 0.1795,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16061750054359436,
|
|
"step": 2140,
|
|
"valid_targets_mean": 5402.7,
|
|
"valid_targets_min": 709
|
|
},
|
|
{
|
|
"epoch": 3.3255813953488373,
|
|
"grad_norm": 0.4010813470774762,
|
|
"learning_rate": 2.5190072274495028e-05,
|
|
"loss": 0.1711,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1538451462984085,
|
|
"step": 2145,
|
|
"valid_targets_mean": 4433.6,
|
|
"valid_targets_min": 339
|
|
},
|
|
{
|
|
"epoch": 3.3333333333333335,
|
|
"grad_norm": 0.3582230333794788,
|
|
"learning_rate": 2.511536056468328e-05,
|
|
"loss": 0.1496,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13346490263938904,
|
|
"step": 2150,
|
|
"valid_targets_mean": 4958.1,
|
|
"valid_targets_min": 676
|
|
},
|
|
{
|
|
"epoch": 3.3410852713178296,
|
|
"grad_norm": 0.4020066100217078,
|
|
"learning_rate": 2.5040572397067645e-05,
|
|
"loss": 0.1679,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19228683412075043,
|
|
"step": 2155,
|
|
"valid_targets_mean": 5232.5,
|
|
"valid_targets_min": 760
|
|
},
|
|
{
|
|
"epoch": 3.3488372093023258,
|
|
"grad_norm": 0.3855313842797188,
|
|
"learning_rate": 2.4965708889485062e-05,
|
|
"loss": 0.1718,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17724131047725677,
|
|
"step": 2160,
|
|
"valid_targets_mean": 4920.0,
|
|
"valid_targets_min": 1946
|
|
},
|
|
{
|
|
"epoch": 3.356589147286822,
|
|
"grad_norm": 0.4532744687578762,
|
|
"learning_rate": 2.489077116089858e-05,
|
|
"loss": 0.1914,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22503584623336792,
|
|
"step": 2165,
|
|
"valid_targets_mean": 4651.2,
|
|
"valid_targets_min": 272
|
|
},
|
|
{
|
|
"epoch": 3.3643410852713176,
|
|
"grad_norm": 0.4366754770288092,
|
|
"learning_rate": 2.4815760331380578e-05,
|
|
"loss": 0.1911,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2072749137878418,
|
|
"step": 2170,
|
|
"valid_targets_mean": 4974.6,
|
|
"valid_targets_min": 450
|
|
},
|
|
{
|
|
"epoch": 3.3720930232558137,
|
|
"grad_norm": 0.5215057560813444,
|
|
"learning_rate": 2.4740677522096078e-05,
|
|
"loss": 0.1689,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2247978001832962,
|
|
"step": 2175,
|
|
"valid_targets_mean": 3434.2,
|
|
"valid_targets_min": 352
|
|
},
|
|
{
|
|
"epoch": 3.37984496124031,
|
|
"grad_norm": 0.43695153967165795,
|
|
"learning_rate": 2.4665523855285954e-05,
|
|
"loss": 0.163,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1621866375207901,
|
|
"step": 2180,
|
|
"valid_targets_mean": 3792.3,
|
|
"valid_targets_min": 364
|
|
},
|
|
{
|
|
"epoch": 3.387596899224806,
|
|
"grad_norm": 0.40940303711183107,
|
|
"learning_rate": 2.4590300454250164e-05,
|
|
"loss": 0.1444,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14481836557388306,
|
|
"step": 2185,
|
|
"valid_targets_mean": 4906.2,
|
|
"valid_targets_min": 2115
|
|
},
|
|
{
|
|
"epoch": 3.395348837209302,
|
|
"grad_norm": 0.41242022872473294,
|
|
"learning_rate": 2.4515008443330963e-05,
|
|
"loss": 0.1706,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16337113082408905,
|
|
"step": 2190,
|
|
"valid_targets_mean": 4234.1,
|
|
"valid_targets_min": 339
|
|
},
|
|
{
|
|
"epoch": 3.4031007751937983,
|
|
"grad_norm": 0.34565747520342643,
|
|
"learning_rate": 2.4439648947896103e-05,
|
|
"loss": 0.1771,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14244988560676575,
|
|
"step": 2195,
|
|
"valid_targets_mean": 5911.4,
|
|
"valid_targets_min": 216
|
|
},
|
|
{
|
|
"epoch": 3.4108527131782944,
|
|
"grad_norm": 0.47813710313391616,
|
|
"learning_rate": 2.4364223094322004e-05,
|
|
"loss": 0.1674,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16893121600151062,
|
|
"step": 2200,
|
|
"valid_targets_mean": 4232.1,
|
|
"valid_targets_min": 284
|
|
},
|
|
{
|
|
"epoch": 3.4186046511627906,
|
|
"grad_norm": 0.41110932893026,
|
|
"learning_rate": 2.4288732009976928e-05,
|
|
"loss": 0.1566,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14816223084926605,
|
|
"step": 2205,
|
|
"valid_targets_mean": 4381.5,
|
|
"valid_targets_min": 2163
|
|
},
|
|
{
|
|
"epoch": 3.4263565891472867,
|
|
"grad_norm": 0.4329916569520111,
|
|
"learning_rate": 2.4213176823204103e-05,
|
|
"loss": 0.1709,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15532240271568298,
|
|
"step": 2210,
|
|
"valid_targets_mean": 3792.0,
|
|
"valid_targets_min": 575
|
|
},
|
|
{
|
|
"epoch": 3.434108527131783,
|
|
"grad_norm": 0.47293777686859195,
|
|
"learning_rate": 2.4137558663304907e-05,
|
|
"loss": 0.1868,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17490163445472717,
|
|
"step": 2215,
|
|
"valid_targets_mean": 4627.6,
|
|
"valid_targets_min": 304
|
|
},
|
|
{
|
|
"epoch": 3.441860465116279,
|
|
"grad_norm": 0.42026578348250343,
|
|
"learning_rate": 2.4061878660521927e-05,
|
|
"loss": 0.1764,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14874975383281708,
|
|
"step": 2220,
|
|
"valid_targets_mean": 3723.0,
|
|
"valid_targets_min": 2346
|
|
},
|
|
{
|
|
"epoch": 3.449612403100775,
|
|
"grad_norm": 0.5448600259555658,
|
|
"learning_rate": 2.3986137946022132e-05,
|
|
"loss": 0.1755,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23847255110740662,
|
|
"step": 2225,
|
|
"valid_targets_mean": 3648.1,
|
|
"valid_targets_min": 556
|
|
},
|
|
{
|
|
"epoch": 3.4573643410852712,
|
|
"grad_norm": 0.3526959052609803,
|
|
"learning_rate": 2.3910337651879902e-05,
|
|
"loss": 0.1745,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15136197209358215,
|
|
"step": 2230,
|
|
"valid_targets_mean": 5305.6,
|
|
"valid_targets_min": 632
|
|
},
|
|
{
|
|
"epoch": 3.4651162790697674,
|
|
"grad_norm": 0.4609105179523114,
|
|
"learning_rate": 2.3834478911060144e-05,
|
|
"loss": 0.1824,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1996048092842102,
|
|
"step": 2235,
|
|
"valid_targets_mean": 4194.4,
|
|
"valid_targets_min": 628
|
|
},
|
|
{
|
|
"epoch": 3.4728682170542635,
|
|
"grad_norm": 0.3632917288631249,
|
|
"learning_rate": 2.3758562857401365e-05,
|
|
"loss": 0.1818,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14042022824287415,
|
|
"step": 2240,
|
|
"valid_targets_mean": 4892.4,
|
|
"valid_targets_min": 431
|
|
},
|
|
{
|
|
"epoch": 3.4806201550387597,
|
|
"grad_norm": 0.3596297602071797,
|
|
"learning_rate": 2.3682590625598682e-05,
|
|
"loss": 0.1664,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1568746566772461,
|
|
"step": 2245,
|
|
"valid_targets_mean": 5468.7,
|
|
"valid_targets_min": 818
|
|
},
|
|
{
|
|
"epoch": 3.488372093023256,
|
|
"grad_norm": 0.36656096196128835,
|
|
"learning_rate": 2.360656335118692e-05,
|
|
"loss": 0.1764,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15595552325248718,
|
|
"step": 2250,
|
|
"valid_targets_mean": 4770.1,
|
|
"valid_targets_min": 330
|
|
},
|
|
{
|
|
"epoch": 3.496124031007752,
|
|
"grad_norm": 0.4048396000613103,
|
|
"learning_rate": 2.3530482170523604e-05,
|
|
"loss": 0.1691,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2218673974275589,
|
|
"step": 2255,
|
|
"valid_targets_mean": 4977.7,
|
|
"valid_targets_min": 346
|
|
},
|
|
{
|
|
"epoch": 3.503875968992248,
|
|
"grad_norm": 0.4120002351387735,
|
|
"learning_rate": 2.3454348220771966e-05,
|
|
"loss": 0.1876,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1626529097557068,
|
|
"step": 2260,
|
|
"valid_targets_mean": 4942.2,
|
|
"valid_targets_min": 1938
|
|
},
|
|
{
|
|
"epoch": 3.511627906976744,
|
|
"grad_norm": 0.46155281185784397,
|
|
"learning_rate": 2.337816263988397e-05,
|
|
"loss": 0.1677,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2315581887960434,
|
|
"step": 2265,
|
|
"valid_targets_mean": 5495.6,
|
|
"valid_targets_min": 1092
|
|
},
|
|
{
|
|
"epoch": 3.5193798449612403,
|
|
"grad_norm": 0.4144849480419605,
|
|
"learning_rate": 2.3301926566583292e-05,
|
|
"loss": 0.1816,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.166578471660614,
|
|
"step": 2270,
|
|
"valid_targets_mean": 4457.1,
|
|
"valid_targets_min": 2280
|
|
},
|
|
{
|
|
"epoch": 3.5271317829457365,
|
|
"grad_norm": 0.4109601135912686,
|
|
"learning_rate": 2.3225641140348306e-05,
|
|
"loss": 0.1701,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17378325760364532,
|
|
"step": 2275,
|
|
"valid_targets_mean": 4608.7,
|
|
"valid_targets_min": 551
|
|
},
|
|
{
|
|
"epoch": 3.5348837209302326,
|
|
"grad_norm": 0.4582644976154119,
|
|
"learning_rate": 2.3149307501395056e-05,
|
|
"loss": 0.1446,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15773174166679382,
|
|
"step": 2280,
|
|
"valid_targets_mean": 4992.6,
|
|
"valid_targets_min": 740
|
|
},
|
|
{
|
|
"epoch": 3.5426356589147288,
|
|
"grad_norm": 0.46360151480816175,
|
|
"learning_rate": 2.3072926790660203e-05,
|
|
"loss": 0.1964,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20285546779632568,
|
|
"step": 2285,
|
|
"valid_targets_mean": 4078.0,
|
|
"valid_targets_min": 532
|
|
},
|
|
{
|
|
"epoch": 3.550387596899225,
|
|
"grad_norm": 0.4408826537960868,
|
|
"learning_rate": 2.2996500149783973e-05,
|
|
"loss": 0.1868,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13840195536613464,
|
|
"step": 2290,
|
|
"valid_targets_mean": 4301.3,
|
|
"valid_targets_min": 606
|
|
},
|
|
{
|
|
"epoch": 3.558139534883721,
|
|
"grad_norm": 0.41302173935323416,
|
|
"learning_rate": 2.292002872109309e-05,
|
|
"loss": 0.1806,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19090792536735535,
|
|
"step": 2295,
|
|
"valid_targets_mean": 4607.9,
|
|
"valid_targets_min": 1945
|
|
},
|
|
{
|
|
"epoch": 3.565891472868217,
|
|
"grad_norm": 0.48709929421908504,
|
|
"learning_rate": 2.284351364758373e-05,
|
|
"loss": 0.1747,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16162961721420288,
|
|
"step": 2300,
|
|
"valid_targets_mean": 2969.8,
|
|
"valid_targets_min": 411
|
|
},
|
|
{
|
|
"epoch": 3.5736434108527133,
|
|
"grad_norm": 0.34907911319518736,
|
|
"learning_rate": 2.2766956072904397e-05,
|
|
"loss": 0.1637,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16097891330718994,
|
|
"step": 2305,
|
|
"valid_targets_mean": 5617.7,
|
|
"valid_targets_min": 343
|
|
},
|
|
{
|
|
"epoch": 3.5813953488372094,
|
|
"grad_norm": 0.41643473859763513,
|
|
"learning_rate": 2.2690357141338853e-05,
|
|
"loss": 0.1923,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16287288069725037,
|
|
"step": 2310,
|
|
"valid_targets_mean": 4270.3,
|
|
"valid_targets_min": 1388
|
|
},
|
|
{
|
|
"epoch": 3.5891472868217056,
|
|
"grad_norm": 0.36847179752276477,
|
|
"learning_rate": 2.2613717997789016e-05,
|
|
"loss": 0.1762,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1488853245973587,
|
|
"step": 2315,
|
|
"valid_targets_mean": 4785.6,
|
|
"valid_targets_min": 661
|
|
},
|
|
{
|
|
"epoch": 3.5968992248062017,
|
|
"grad_norm": 0.41943679729107547,
|
|
"learning_rate": 2.2537039787757817e-05,
|
|
"loss": 0.1956,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19536623358726501,
|
|
"step": 2320,
|
|
"valid_targets_mean": 4583.6,
|
|
"valid_targets_min": 2379
|
|
},
|
|
{
|
|
"epoch": 3.604651162790698,
|
|
"grad_norm": 0.3773107032307372,
|
|
"learning_rate": 2.2460323657332138e-05,
|
|
"loss": 0.1756,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13412323594093323,
|
|
"step": 2325,
|
|
"valid_targets_mean": 4938.5,
|
|
"valid_targets_min": 766
|
|
},
|
|
{
|
|
"epoch": 3.612403100775194,
|
|
"grad_norm": 0.41099143457360815,
|
|
"learning_rate": 2.2383570753165615e-05,
|
|
"loss": 0.1752,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.146214097738266,
|
|
"step": 2330,
|
|
"valid_targets_mean": 4063.8,
|
|
"valid_targets_min": 520
|
|
},
|
|
{
|
|
"epoch": 3.62015503875969,
|
|
"grad_norm": 0.3494048218491353,
|
|
"learning_rate": 2.2306782222461547e-05,
|
|
"loss": 0.16,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1244577169418335,
|
|
"step": 2335,
|
|
"valid_targets_mean": 4674.1,
|
|
"valid_targets_min": 516
|
|
},
|
|
{
|
|
"epoch": 3.6279069767441863,
|
|
"grad_norm": 0.4137755237450408,
|
|
"learning_rate": 2.2229959212955735e-05,
|
|
"loss": 0.1557,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1691616028547287,
|
|
"step": 2340,
|
|
"valid_targets_mean": 4078.2,
|
|
"valid_targets_min": 957
|
|
},
|
|
{
|
|
"epoch": 3.6356589147286824,
|
|
"grad_norm": 0.41202438782783035,
|
|
"learning_rate": 2.2153102872899313e-05,
|
|
"loss": 0.181,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19243177771568298,
|
|
"step": 2345,
|
|
"valid_targets_mean": 5443.7,
|
|
"valid_targets_min": 684
|
|
},
|
|
{
|
|
"epoch": 3.6434108527131785,
|
|
"grad_norm": 0.4168252301471801,
|
|
"learning_rate": 2.20762143510416e-05,
|
|
"loss": 0.1601,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1762881577014923,
|
|
"step": 2350,
|
|
"valid_targets_mean": 4094.8,
|
|
"valid_targets_min": 436
|
|
},
|
|
{
|
|
"epoch": 3.6511627906976747,
|
|
"grad_norm": 0.3658382509380567,
|
|
"learning_rate": 2.1999294796612926e-05,
|
|
"loss": 0.1635,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13929161429405212,
|
|
"step": 2355,
|
|
"valid_targets_mean": 5087.1,
|
|
"valid_targets_min": 2622
|
|
},
|
|
{
|
|
"epoch": 3.6589147286821704,
|
|
"grad_norm": 0.806554291125336,
|
|
"learning_rate": 2.1922345359307468e-05,
|
|
"loss": 0.1862,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24180075526237488,
|
|
"step": 2360,
|
|
"valid_targets_mean": 3961.2,
|
|
"valid_targets_min": 567
|
|
},
|
|
{
|
|
"epoch": 3.6666666666666665,
|
|
"grad_norm": 0.4010351294747989,
|
|
"learning_rate": 2.184536718926604e-05,
|
|
"loss": 0.1856,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15781967341899872,
|
|
"step": 2365,
|
|
"valid_targets_mean": 4302.3,
|
|
"valid_targets_min": 481
|
|
},
|
|
{
|
|
"epoch": 3.6744186046511627,
|
|
"grad_norm": 0.4910349746865378,
|
|
"learning_rate": 2.1768361437058924e-05,
|
|
"loss": 0.1822,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15803927183151245,
|
|
"step": 2370,
|
|
"valid_targets_mean": 5285.8,
|
|
"valid_targets_min": 1922
|
|
},
|
|
{
|
|
"epoch": 3.682170542635659,
|
|
"grad_norm": 0.5033930845464233,
|
|
"learning_rate": 2.1691329253668657e-05,
|
|
"loss": 0.1773,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16929282248020172,
|
|
"step": 2375,
|
|
"valid_targets_mean": 3518.6,
|
|
"valid_targets_min": 661
|
|
},
|
|
{
|
|
"epoch": 3.689922480620155,
|
|
"grad_norm": 0.4812536807942641,
|
|
"learning_rate": 2.1614271790472835e-05,
|
|
"loss": 0.1666,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16329653561115265,
|
|
"step": 2380,
|
|
"valid_targets_mean": 3963.1,
|
|
"valid_targets_min": 513
|
|
},
|
|
{
|
|
"epoch": 3.697674418604651,
|
|
"grad_norm": 0.4106493741878364,
|
|
"learning_rate": 2.1537190199226917e-05,
|
|
"loss": 0.1822,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15833979845046997,
|
|
"step": 2385,
|
|
"valid_targets_mean": 4434.0,
|
|
"valid_targets_min": 678
|
|
},
|
|
{
|
|
"epoch": 3.705426356589147,
|
|
"grad_norm": 0.42703025254446647,
|
|
"learning_rate": 2.1460085632046983e-05,
|
|
"loss": 0.1842,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19955435395240784,
|
|
"step": 2390,
|
|
"valid_targets_mean": 4425.7,
|
|
"valid_targets_min": 268
|
|
},
|
|
{
|
|
"epoch": 3.7131782945736433,
|
|
"grad_norm": 0.3400275265721782,
|
|
"learning_rate": 2.138295924139253e-05,
|
|
"loss": 0.1584,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13872955739498138,
|
|
"step": 2395,
|
|
"valid_targets_mean": 5467.9,
|
|
"valid_targets_min": 319
|
|
},
|
|
{
|
|
"epoch": 3.7209302325581395,
|
|
"grad_norm": 0.3682059763421827,
|
|
"learning_rate": 2.1305812180049258e-05,
|
|
"loss": 0.1697,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14761081337928772,
|
|
"step": 2400,
|
|
"valid_targets_mean": 5667.8,
|
|
"valid_targets_min": 2894
|
|
},
|
|
{
|
|
"epoch": 3.7286821705426356,
|
|
"grad_norm": 0.3974454201846236,
|
|
"learning_rate": 2.12286456011118e-05,
|
|
"loss": 0.1629,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18874874711036682,
|
|
"step": 2405,
|
|
"valid_targets_mean": 5224.0,
|
|
"valid_targets_min": 3081
|
|
},
|
|
{
|
|
"epoch": 3.7364341085271318,
|
|
"grad_norm": 0.39427590403656537,
|
|
"learning_rate": 2.1151460657966543e-05,
|
|
"loss": 0.1731,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14733751118183136,
|
|
"step": 2410,
|
|
"valid_targets_mean": 4060.3,
|
|
"valid_targets_min": 2348
|
|
},
|
|
{
|
|
"epoch": 3.744186046511628,
|
|
"grad_norm": 0.4347000971418473,
|
|
"learning_rate": 2.1074258504274324e-05,
|
|
"loss": 0.1691,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16277927160263062,
|
|
"step": 2415,
|
|
"valid_targets_mean": 4161.8,
|
|
"valid_targets_min": 325
|
|
},
|
|
{
|
|
"epoch": 3.751937984496124,
|
|
"grad_norm": 0.46642613155184653,
|
|
"learning_rate": 2.099704029395325e-05,
|
|
"loss": 0.1635,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17865529656410217,
|
|
"step": 2420,
|
|
"valid_targets_mean": 3506.7,
|
|
"valid_targets_min": 322
|
|
},
|
|
{
|
|
"epoch": 3.75968992248062,
|
|
"grad_norm": 0.36926786871608897,
|
|
"learning_rate": 2.0919807181161413e-05,
|
|
"loss": 0.182,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1872124969959259,
|
|
"step": 2425,
|
|
"valid_targets_mean": 5992.2,
|
|
"valid_targets_min": 2637
|
|
},
|
|
{
|
|
"epoch": 3.7674418604651163,
|
|
"grad_norm": 0.40797959752050406,
|
|
"learning_rate": 2.0842560320279647e-05,
|
|
"loss": 0.1795,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13483797013759613,
|
|
"step": 2430,
|
|
"valid_targets_mean": 3735.1,
|
|
"valid_targets_min": 396
|
|
},
|
|
{
|
|
"epoch": 3.7751937984496124,
|
|
"grad_norm": 0.3569093694297914,
|
|
"learning_rate": 2.0765300865894273e-05,
|
|
"loss": 0.1709,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16950270533561707,
|
|
"step": 2435,
|
|
"valid_targets_mean": 5004.4,
|
|
"valid_targets_min": 341
|
|
},
|
|
{
|
|
"epoch": 3.7829457364341086,
|
|
"grad_norm": 0.489744210232547,
|
|
"learning_rate": 2.068802997277984e-05,
|
|
"loss": 0.1676,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14903788268566132,
|
|
"step": 2440,
|
|
"valid_targets_mean": 4375.1,
|
|
"valid_targets_min": 613
|
|
},
|
|
{
|
|
"epoch": 3.7906976744186047,
|
|
"grad_norm": 0.4631630261801319,
|
|
"learning_rate": 2.061074879588187e-05,
|
|
"loss": 0.1761,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17495691776275635,
|
|
"step": 2445,
|
|
"valid_targets_mean": 4443.9,
|
|
"valid_targets_min": 2333
|
|
},
|
|
{
|
|
"epoch": 3.798449612403101,
|
|
"grad_norm": 0.381627105046557,
|
|
"learning_rate": 2.0533458490299608e-05,
|
|
"loss": 0.172,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19416113197803497,
|
|
"step": 2450,
|
|
"valid_targets_mean": 5910.8,
|
|
"valid_targets_min": 813
|
|
},
|
|
{
|
|
"epoch": 3.806201550387597,
|
|
"grad_norm": 0.3672369381288124,
|
|
"learning_rate": 2.0456160211268726e-05,
|
|
"loss": 0.1523,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15462546050548553,
|
|
"step": 2455,
|
|
"valid_targets_mean": 4590.2,
|
|
"valid_targets_min": 425
|
|
},
|
|
{
|
|
"epoch": 3.813953488372093,
|
|
"grad_norm": 0.36355092211128553,
|
|
"learning_rate": 2.037885511414408e-05,
|
|
"loss": 0.1685,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1489698588848114,
|
|
"step": 2460,
|
|
"valid_targets_mean": 4814.1,
|
|
"valid_targets_min": 250
|
|
},
|
|
{
|
|
"epoch": 3.8217054263565893,
|
|
"grad_norm": 0.5834913333456886,
|
|
"learning_rate": 2.030154435438243e-05,
|
|
"loss": 0.1806,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17469245195388794,
|
|
"step": 2465,
|
|
"valid_targets_mean": 4683.1,
|
|
"valid_targets_min": 227
|
|
},
|
|
{
|
|
"epoch": 3.8294573643410854,
|
|
"grad_norm": 0.3750569957368585,
|
|
"learning_rate": 2.0224229087525176e-05,
|
|
"loss": 0.1638,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16605322062969208,
|
|
"step": 2470,
|
|
"valid_targets_mean": 5050.2,
|
|
"valid_targets_min": 2206
|
|
},
|
|
{
|
|
"epoch": 3.8372093023255816,
|
|
"grad_norm": 0.4159111267532109,
|
|
"learning_rate": 2.0146910469181083e-05,
|
|
"loss": 0.1798,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16885146498680115,
|
|
"step": 2475,
|
|
"valid_targets_mean": 4601.3,
|
|
"valid_targets_min": 761
|
|
},
|
|
{
|
|
"epoch": 3.8449612403100772,
|
|
"grad_norm": 0.3729264179998901,
|
|
"learning_rate": 2.006958965500901e-05,
|
|
"loss": 0.1699,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15141122043132782,
|
|
"step": 2480,
|
|
"valid_targets_mean": 4849.9,
|
|
"valid_targets_min": 2352
|
|
},
|
|
{
|
|
"epoch": 3.8527131782945734,
|
|
"grad_norm": 0.5766276206946744,
|
|
"learning_rate": 1.9992267800700643e-05,
|
|
"loss": 0.1783,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19176653027534485,
|
|
"step": 2485,
|
|
"valid_targets_mean": 3846.1,
|
|
"valid_targets_min": 731
|
|
},
|
|
{
|
|
"epoch": 3.8604651162790695,
|
|
"grad_norm": 0.3706800726667539,
|
|
"learning_rate": 1.991494606196321e-05,
|
|
"loss": 0.1515,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1340998411178589,
|
|
"step": 2490,
|
|
"valid_targets_mean": 4474.6,
|
|
"valid_targets_min": 269
|
|
},
|
|
{
|
|
"epoch": 3.8682170542635657,
|
|
"grad_norm": 0.44584862226366007,
|
|
"learning_rate": 1.98376255945022e-05,
|
|
"loss": 0.1778,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16283494234085083,
|
|
"step": 2495,
|
|
"valid_targets_mean": 4311.2,
|
|
"valid_targets_min": 1115
|
|
},
|
|
{
|
|
"epoch": 3.875968992248062,
|
|
"grad_norm": 0.3592938976849822,
|
|
"learning_rate": 1.9760307554004122e-05,
|
|
"loss": 0.1524,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18098889291286469,
|
|
"step": 2500,
|
|
"valid_targets_mean": 5765.5,
|
|
"valid_targets_min": 528
|
|
},
|
|
{
|
|
"epoch": 3.883720930232558,
|
|
"grad_norm": 0.4223273599027322,
|
|
"learning_rate": 1.9682993096119197e-05,
|
|
"loss": 0.1693,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16485443711280823,
|
|
"step": 2505,
|
|
"valid_targets_mean": 4137.4,
|
|
"valid_targets_min": 901
|
|
},
|
|
{
|
|
"epoch": 3.891472868217054,
|
|
"grad_norm": 0.4448395910223574,
|
|
"learning_rate": 1.9605683376444086e-05,
|
|
"loss": 0.1817,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1999254673719406,
|
|
"step": 2510,
|
|
"valid_targets_mean": 3733.8,
|
|
"valid_targets_min": 266
|
|
},
|
|
{
|
|
"epoch": 3.89922480620155,
|
|
"grad_norm": 0.44711782753625473,
|
|
"learning_rate": 1.9528379550504663e-05,
|
|
"loss": 0.1975,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2123761773109436,
|
|
"step": 2515,
|
|
"valid_targets_mean": 3842.1,
|
|
"valid_targets_min": 489
|
|
},
|
|
{
|
|
"epoch": 3.9069767441860463,
|
|
"grad_norm": 0.3585629672419737,
|
|
"learning_rate": 1.945108277373869e-05,
|
|
"loss": 0.1668,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16551396250724792,
|
|
"step": 2520,
|
|
"valid_targets_mean": 5320.1,
|
|
"valid_targets_min": 513
|
|
},
|
|
{
|
|
"epoch": 3.9147286821705425,
|
|
"grad_norm": 0.38593055920198166,
|
|
"learning_rate": 1.9373794201478554e-05,
|
|
"loss": 0.1681,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17138083279132843,
|
|
"step": 2525,
|
|
"valid_targets_mean": 4754.8,
|
|
"valid_targets_min": 325
|
|
},
|
|
{
|
|
"epoch": 3.9224806201550386,
|
|
"grad_norm": 0.34993836610858403,
|
|
"learning_rate": 1.9296514988934018e-05,
|
|
"loss": 0.1532,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13611240684986115,
|
|
"step": 2530,
|
|
"valid_targets_mean": 4849.8,
|
|
"valid_targets_min": 299
|
|
},
|
|
{
|
|
"epoch": 3.9302325581395348,
|
|
"grad_norm": 0.38998762581393137,
|
|
"learning_rate": 1.921924629117498e-05,
|
|
"loss": 0.169,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16259539127349854,
|
|
"step": 2535,
|
|
"valid_targets_mean": 4528.8,
|
|
"valid_targets_min": 1955
|
|
},
|
|
{
|
|
"epoch": 3.937984496124031,
|
|
"grad_norm": 0.4406751870739783,
|
|
"learning_rate": 1.9141989263114136e-05,
|
|
"loss": 0.185,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1572207659482956,
|
|
"step": 2540,
|
|
"valid_targets_mean": 3975.7,
|
|
"valid_targets_min": 709
|
|
},
|
|
{
|
|
"epoch": 3.945736434108527,
|
|
"grad_norm": 0.45031010235314506,
|
|
"learning_rate": 1.9064745059489774e-05,
|
|
"loss": 0.1841,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1765103042125702,
|
|
"step": 2545,
|
|
"valid_targets_mean": 3726.0,
|
|
"valid_targets_min": 282
|
|
},
|
|
{
|
|
"epoch": 3.953488372093023,
|
|
"grad_norm": 0.6078467791119643,
|
|
"learning_rate": 1.8987514834848503e-05,
|
|
"loss": 0.1611,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17429549992084503,
|
|
"step": 2550,
|
|
"valid_targets_mean": 3989.9,
|
|
"valid_targets_min": 685
|
|
},
|
|
{
|
|
"epoch": 3.9612403100775193,
|
|
"grad_norm": 0.3631710161577126,
|
|
"learning_rate": 1.8910299743527993e-05,
|
|
"loss": 0.1697,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1885673701763153,
|
|
"step": 2555,
|
|
"valid_targets_mean": 5834.6,
|
|
"valid_targets_min": 585
|
|
},
|
|
{
|
|
"epoch": 3.9689922480620154,
|
|
"grad_norm": 0.49167632435325864,
|
|
"learning_rate": 1.8833100939639694e-05,
|
|
"loss": 0.1624,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20458854734897614,
|
|
"step": 2560,
|
|
"valid_targets_mean": 3560.4,
|
|
"valid_targets_min": 419
|
|
},
|
|
{
|
|
"epoch": 3.9767441860465116,
|
|
"grad_norm": 0.3634420862575136,
|
|
"learning_rate": 1.875591957705166e-05,
|
|
"loss": 0.1785,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13289107382297516,
|
|
"step": 2565,
|
|
"valid_targets_mean": 5413.6,
|
|
"valid_targets_min": 1805
|
|
},
|
|
{
|
|
"epoch": 3.9844961240310077,
|
|
"grad_norm": 0.4586334241085507,
|
|
"learning_rate": 1.867875680937122e-05,
|
|
"loss": 0.1691,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2052847146987915,
|
|
"step": 2570,
|
|
"valid_targets_mean": 4061.1,
|
|
"valid_targets_min": 615
|
|
},
|
|
{
|
|
"epoch": 3.992248062015504,
|
|
"grad_norm": 0.43210061293605817,
|
|
"learning_rate": 1.860161378992778e-05,
|
|
"loss": 0.1779,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2044166624546051,
|
|
"step": 2575,
|
|
"valid_targets_mean": 4605.4,
|
|
"valid_targets_min": 605
|
|
},
|
|
{
|
|
"epoch": 4.0,
|
|
"grad_norm": 0.37276933625985337,
|
|
"learning_rate": 1.8524491671755563e-05,
|
|
"loss": 0.1763,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1616727113723755,
|
|
"step": 2580,
|
|
"valid_targets_mean": 5067.4,
|
|
"valid_targets_min": 527
|
|
},
|
|
{
|
|
"epoch": 4.007751937984496,
|
|
"grad_norm": 0.36563074448629657,
|
|
"learning_rate": 1.8447391607576416e-05,
|
|
"loss": 0.1441,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13933786749839783,
|
|
"step": 2585,
|
|
"valid_targets_mean": 4913.7,
|
|
"valid_targets_min": 740
|
|
},
|
|
{
|
|
"epoch": 4.015503875968992,
|
|
"grad_norm": 0.4772926288066321,
|
|
"learning_rate": 1.8370314749782524e-05,
|
|
"loss": 0.1581,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18599829077720642,
|
|
"step": 2590,
|
|
"valid_targets_mean": 4072.6,
|
|
"valid_targets_min": 666
|
|
},
|
|
{
|
|
"epoch": 4.023255813953488,
|
|
"grad_norm": 0.4964995939447069,
|
|
"learning_rate": 1.8293262250419215e-05,
|
|
"loss": 0.165,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16809843480587006,
|
|
"step": 2595,
|
|
"valid_targets_mean": 3508.6,
|
|
"valid_targets_min": 2368
|
|
},
|
|
{
|
|
"epoch": 4.0310077519379846,
|
|
"grad_norm": 0.5174597685405774,
|
|
"learning_rate": 1.8216235261167765e-05,
|
|
"loss": 0.1731,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2505348324775696,
|
|
"step": 2600,
|
|
"valid_targets_mean": 4262.7,
|
|
"valid_targets_min": 970
|
|
},
|
|
{
|
|
"epoch": 4.038759689922481,
|
|
"grad_norm": 0.40606990941323745,
|
|
"learning_rate": 1.8139234933328126e-05,
|
|
"loss": 0.1677,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.138991117477417,
|
|
"step": 2605,
|
|
"valid_targets_mean": 5074.9,
|
|
"valid_targets_min": 680
|
|
},
|
|
{
|
|
"epoch": 4.046511627906977,
|
|
"grad_norm": 0.4634993018273127,
|
|
"learning_rate": 1.8062262417801767e-05,
|
|
"loss": 0.1539,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1454424411058426,
|
|
"step": 2610,
|
|
"valid_targets_mean": 4132.0,
|
|
"valid_targets_min": 315
|
|
},
|
|
{
|
|
"epoch": 4.054263565891473,
|
|
"grad_norm": 0.45594388080755227,
|
|
"learning_rate": 1.7985318865074445e-05,
|
|
"loss": 0.1558,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13495397567749023,
|
|
"step": 2615,
|
|
"valid_targets_mean": 4592.6,
|
|
"valid_targets_min": 908
|
|
},
|
|
{
|
|
"epoch": 4.062015503875969,
|
|
"grad_norm": 0.3632193067972436,
|
|
"learning_rate": 1.790840542519903e-05,
|
|
"loss": 0.1581,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14542677998542786,
|
|
"step": 2620,
|
|
"valid_targets_mean": 6443.2,
|
|
"valid_targets_min": 674
|
|
},
|
|
{
|
|
"epoch": 4.069767441860465,
|
|
"grad_norm": 0.4084216853540113,
|
|
"learning_rate": 1.7831523247778296e-05,
|
|
"loss": 0.1361,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15561866760253906,
|
|
"step": 2625,
|
|
"valid_targets_mean": 4696.6,
|
|
"valid_targets_min": 669
|
|
},
|
|
{
|
|
"epoch": 4.077519379844961,
|
|
"grad_norm": 0.4622453535570728,
|
|
"learning_rate": 1.775467348194774e-05,
|
|
"loss": 0.1508,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1541646271944046,
|
|
"step": 2630,
|
|
"valid_targets_mean": 4509.7,
|
|
"valid_targets_min": 585
|
|
},
|
|
{
|
|
"epoch": 4.0852713178294575,
|
|
"grad_norm": 0.36481781559899207,
|
|
"learning_rate": 1.767785727635843e-05,
|
|
"loss": 0.1445,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1567380130290985,
|
|
"step": 2635,
|
|
"valid_targets_mean": 6221.8,
|
|
"valid_targets_min": 761
|
|
},
|
|
{
|
|
"epoch": 4.093023255813954,
|
|
"grad_norm": 0.3792078104165168,
|
|
"learning_rate": 1.7601075779159806e-05,
|
|
"loss": 0.1463,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12530960142612457,
|
|
"step": 2640,
|
|
"valid_targets_mean": 4478.4,
|
|
"valid_targets_min": 361
|
|
},
|
|
{
|
|
"epoch": 4.10077519379845,
|
|
"grad_norm": 0.4219019340853787,
|
|
"learning_rate": 1.7524330137982524e-05,
|
|
"loss": 0.1563,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18058227002620697,
|
|
"step": 2645,
|
|
"valid_targets_mean": 4726.9,
|
|
"valid_targets_min": 2654
|
|
},
|
|
{
|
|
"epoch": 4.108527131782946,
|
|
"grad_norm": 0.42766284883408445,
|
|
"learning_rate": 1.7447621499921342e-05,
|
|
"loss": 0.1555,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16935157775878906,
|
|
"step": 2650,
|
|
"valid_targets_mean": 4662.6,
|
|
"valid_targets_min": 2874
|
|
},
|
|
{
|
|
"epoch": 4.116279069767442,
|
|
"grad_norm": 0.4480590715700904,
|
|
"learning_rate": 1.7370951011517906e-05,
|
|
"loss": 0.159,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19573025405406952,
|
|
"step": 2655,
|
|
"valid_targets_mean": 4988.3,
|
|
"valid_targets_min": 887
|
|
},
|
|
{
|
|
"epoch": 4.124031007751938,
|
|
"grad_norm": 0.4647682503763762,
|
|
"learning_rate": 1.7294319818743677e-05,
|
|
"loss": 0.1599,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1806863695383072,
|
|
"step": 2660,
|
|
"valid_targets_mean": 4018.7,
|
|
"valid_targets_min": 684
|
|
},
|
|
{
|
|
"epoch": 4.131782945736434,
|
|
"grad_norm": 0.33468042082332256,
|
|
"learning_rate": 1.7217729066982754e-05,
|
|
"loss": 0.1676,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13625994324684143,
|
|
"step": 2665,
|
|
"valid_targets_mean": 5762.8,
|
|
"valid_targets_min": 3241
|
|
},
|
|
{
|
|
"epoch": 4.1395348837209305,
|
|
"grad_norm": 0.35879066729195264,
|
|
"learning_rate": 1.7141179901014798e-05,
|
|
"loss": 0.151,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1351138949394226,
|
|
"step": 2670,
|
|
"valid_targets_mean": 5373.6,
|
|
"valid_targets_min": 2492
|
|
},
|
|
{
|
|
"epoch": 4.147286821705427,
|
|
"grad_norm": 0.38289139539979355,
|
|
"learning_rate": 1.7064673464997885e-05,
|
|
"loss": 0.1507,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14373061060905457,
|
|
"step": 2675,
|
|
"valid_targets_mean": 4701.4,
|
|
"valid_targets_min": 1523
|
|
},
|
|
{
|
|
"epoch": 4.155038759689923,
|
|
"grad_norm": 0.3514618484402962,
|
|
"learning_rate": 1.698821090245141e-05,
|
|
"loss": 0.1576,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12618312239646912,
|
|
"step": 2680,
|
|
"valid_targets_mean": 5099.0,
|
|
"valid_targets_min": 1436
|
|
},
|
|
{
|
|
"epoch": 4.162790697674419,
|
|
"grad_norm": 0.4029673695317988,
|
|
"learning_rate": 1.691179335623904e-05,
|
|
"loss": 0.151,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15906205773353577,
|
|
"step": 2685,
|
|
"valid_targets_mean": 5508.1,
|
|
"valid_targets_min": 432
|
|
},
|
|
{
|
|
"epoch": 4.170542635658915,
|
|
"grad_norm": 0.4944425640026309,
|
|
"learning_rate": 1.6835421968551556e-05,
|
|
"loss": 0.1478,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14945298433303833,
|
|
"step": 2690,
|
|
"valid_targets_mean": 3783.1,
|
|
"valid_targets_min": 770
|
|
},
|
|
{
|
|
"epoch": 4.178294573643411,
|
|
"grad_norm": 0.4380361387817116,
|
|
"learning_rate": 1.675909788088984e-05,
|
|
"loss": 0.1737,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18563194572925568,
|
|
"step": 2695,
|
|
"valid_targets_mean": 4740.7,
|
|
"valid_targets_min": 2335
|
|
},
|
|
{
|
|
"epoch": 4.186046511627907,
|
|
"grad_norm": 0.4771028211600623,
|
|
"learning_rate": 1.6682822234047796e-05,
|
|
"loss": 0.1555,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1575438231229782,
|
|
"step": 2700,
|
|
"valid_targets_mean": 3456.6,
|
|
"valid_targets_min": 352
|
|
},
|
|
{
|
|
"epoch": 4.1937984496124034,
|
|
"grad_norm": 0.41423182041175527,
|
|
"learning_rate": 1.660659616809529e-05,
|
|
"loss": 0.1599,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13387396931648254,
|
|
"step": 2705,
|
|
"valid_targets_mean": 4664.9,
|
|
"valid_targets_min": 1948
|
|
},
|
|
{
|
|
"epoch": 4.2015503875969,
|
|
"grad_norm": 0.530813584525465,
|
|
"learning_rate": 1.653042082236112e-05,
|
|
"loss": 0.1774,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.3004525601863861,
|
|
"step": 2710,
|
|
"valid_targets_mean": 4756.2,
|
|
"valid_targets_min": 332
|
|
},
|
|
{
|
|
"epoch": 4.209302325581396,
|
|
"grad_norm": 0.44640047447531017,
|
|
"learning_rate": 1.6454297335415975e-05,
|
|
"loss": 0.167,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1683686077594757,
|
|
"step": 2715,
|
|
"valid_targets_mean": 3983.3,
|
|
"valid_targets_min": 558
|
|
},
|
|
{
|
|
"epoch": 4.217054263565892,
|
|
"grad_norm": 0.4231137236979658,
|
|
"learning_rate": 1.6378226845055454e-05,
|
|
"loss": 0.1657,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17019568383693695,
|
|
"step": 2720,
|
|
"valid_targets_mean": 4835.2,
|
|
"valid_targets_min": 600
|
|
},
|
|
{
|
|
"epoch": 4.224806201550388,
|
|
"grad_norm": 0.386736159227142,
|
|
"learning_rate": 1.6302210488282993e-05,
|
|
"loss": 0.1633,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18334552645683289,
|
|
"step": 2725,
|
|
"valid_targets_mean": 5246.4,
|
|
"valid_targets_min": 479
|
|
},
|
|
{
|
|
"epoch": 4.232558139534884,
|
|
"grad_norm": 0.4229332730901514,
|
|
"learning_rate": 1.6226249401292932e-05,
|
|
"loss": 0.1447,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1335538774728775,
|
|
"step": 2730,
|
|
"valid_targets_mean": 4478.2,
|
|
"valid_targets_min": 265
|
|
},
|
|
{
|
|
"epoch": 4.24031007751938,
|
|
"grad_norm": 0.5239959011141749,
|
|
"learning_rate": 1.6150344719453513e-05,
|
|
"loss": 0.1599,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13435792922973633,
|
|
"step": 2735,
|
|
"valid_targets_mean": 4364.5,
|
|
"valid_targets_min": 389
|
|
},
|
|
{
|
|
"epoch": 4.248062015503876,
|
|
"grad_norm": 0.3585379143026963,
|
|
"learning_rate": 1.6074497577289893e-05,
|
|
"loss": 0.1428,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12283202260732651,
|
|
"step": 2740,
|
|
"valid_targets_mean": 5174.9,
|
|
"valid_targets_min": 2143
|
|
},
|
|
{
|
|
"epoch": 4.2558139534883725,
|
|
"grad_norm": 0.41779854478657813,
|
|
"learning_rate": 1.599870910846721e-05,
|
|
"loss": 0.1634,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13781797885894775,
|
|
"step": 2745,
|
|
"valid_targets_mean": 4340.5,
|
|
"valid_targets_min": 2348
|
|
},
|
|
{
|
|
"epoch": 4.263565891472869,
|
|
"grad_norm": 0.47639510138543717,
|
|
"learning_rate": 1.5922980445773618e-05,
|
|
"loss": 0.1688,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20977307856082916,
|
|
"step": 2750,
|
|
"valid_targets_mean": 4089.1,
|
|
"valid_targets_min": 570
|
|
},
|
|
{
|
|
"epoch": 4.271317829457364,
|
|
"grad_norm": 0.4321321807850601,
|
|
"learning_rate": 1.584731272110338e-05,
|
|
"loss": 0.1478,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1279362142086029,
|
|
"step": 2755,
|
|
"valid_targets_mean": 4232.4,
|
|
"valid_targets_min": 661
|
|
},
|
|
{
|
|
"epoch": 4.27906976744186,
|
|
"grad_norm": 0.4163782737967656,
|
|
"learning_rate": 1.5771707065439925e-05,
|
|
"loss": 0.1586,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1572471261024475,
|
|
"step": 2760,
|
|
"valid_targets_mean": 4172.6,
|
|
"valid_targets_min": 362
|
|
},
|
|
{
|
|
"epoch": 4.286821705426356,
|
|
"grad_norm": 0.44476929142723237,
|
|
"learning_rate": 1.5696164608838957e-05,
|
|
"loss": 0.1492,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12877783179283142,
|
|
"step": 2765,
|
|
"valid_targets_mean": 3667.2,
|
|
"valid_targets_min": 324
|
|
},
|
|
{
|
|
"epoch": 4.294573643410852,
|
|
"grad_norm": 0.44033521779323154,
|
|
"learning_rate": 1.5620686480411568e-05,
|
|
"loss": 0.1793,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1912871152162552,
|
|
"step": 2770,
|
|
"valid_targets_mean": 4556.9,
|
|
"valid_targets_min": 571
|
|
},
|
|
{
|
|
"epoch": 4.3023255813953485,
|
|
"grad_norm": 0.43835417771534674,
|
|
"learning_rate": 1.5545273808307358e-05,
|
|
"loss": 0.1762,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18065080046653748,
|
|
"step": 2775,
|
|
"valid_targets_mean": 4829.0,
|
|
"valid_targets_min": 701
|
|
},
|
|
{
|
|
"epoch": 4.310077519379845,
|
|
"grad_norm": 0.4359801265972791,
|
|
"learning_rate": 1.546992771969755e-05,
|
|
"loss": 0.1548,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1816236674785614,
|
|
"step": 2780,
|
|
"valid_targets_mean": 4372.9,
|
|
"valid_targets_min": 313
|
|
},
|
|
{
|
|
"epoch": 4.317829457364341,
|
|
"grad_norm": 0.4410756401612138,
|
|
"learning_rate": 1.5394649340758184e-05,
|
|
"loss": 0.1483,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15419849753379822,
|
|
"step": 2785,
|
|
"valid_targets_mean": 5035.1,
|
|
"valid_targets_min": 2134
|
|
},
|
|
{
|
|
"epoch": 4.325581395348837,
|
|
"grad_norm": 0.4559093303470707,
|
|
"learning_rate": 1.5319439796653258e-05,
|
|
"loss": 0.1586,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17408901453018188,
|
|
"step": 2790,
|
|
"valid_targets_mean": 4336.3,
|
|
"valid_targets_min": 1990
|
|
},
|
|
{
|
|
"epoch": 4.333333333333333,
|
|
"grad_norm": 0.3733614937743712,
|
|
"learning_rate": 1.5244300211517916e-05,
|
|
"loss": 0.1613,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1421089917421341,
|
|
"step": 2795,
|
|
"valid_targets_mean": 4486.0,
|
|
"valid_targets_min": 266
|
|
},
|
|
{
|
|
"epoch": 4.341085271317829,
|
|
"grad_norm": 0.4384718248610877,
|
|
"learning_rate": 1.5169231708441625e-05,
|
|
"loss": 0.1641,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15485528111457825,
|
|
"step": 2800,
|
|
"valid_targets_mean": 4390.1,
|
|
"valid_targets_min": 458
|
|
},
|
|
{
|
|
"epoch": 4.348837209302325,
|
|
"grad_norm": 0.35486111522759517,
|
|
"learning_rate": 1.5094235409451452e-05,
|
|
"loss": 0.1567,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14936892688274384,
|
|
"step": 2805,
|
|
"valid_targets_mean": 5619.9,
|
|
"valid_targets_min": 2606
|
|
},
|
|
{
|
|
"epoch": 4.3565891472868215,
|
|
"grad_norm": 0.4641264262776539,
|
|
"learning_rate": 1.5019312435495215e-05,
|
|
"loss": 0.1681,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16389770805835724,
|
|
"step": 2810,
|
|
"valid_targets_mean": 4543.3,
|
|
"valid_targets_min": 531
|
|
},
|
|
{
|
|
"epoch": 4.364341085271318,
|
|
"grad_norm": 0.4095733450935873,
|
|
"learning_rate": 1.4944463906424773e-05,
|
|
"loss": 0.1602,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15087318420410156,
|
|
"step": 2815,
|
|
"valid_targets_mean": 5138.6,
|
|
"valid_targets_min": 2324
|
|
},
|
|
{
|
|
"epoch": 4.372093023255814,
|
|
"grad_norm": 0.43224144450256036,
|
|
"learning_rate": 1.486969094097929e-05,
|
|
"loss": 0.1864,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17015056312084198,
|
|
"step": 2820,
|
|
"valid_targets_mean": 4383.4,
|
|
"valid_targets_min": 196
|
|
},
|
|
{
|
|
"epoch": 4.37984496124031,
|
|
"grad_norm": 0.42039391089480094,
|
|
"learning_rate": 1.4794994656768485e-05,
|
|
"loss": 0.1835,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16320443153381348,
|
|
"step": 2825,
|
|
"valid_targets_mean": 4572.7,
|
|
"valid_targets_min": 1677
|
|
},
|
|
{
|
|
"epoch": 4.387596899224806,
|
|
"grad_norm": 0.4360528678353131,
|
|
"learning_rate": 1.4720376170255958e-05,
|
|
"loss": 0.1631,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17029808461666107,
|
|
"step": 2830,
|
|
"valid_targets_mean": 4660.2,
|
|
"valid_targets_min": 2294
|
|
},
|
|
{
|
|
"epoch": 4.395348837209302,
|
|
"grad_norm": 0.47146218786067823,
|
|
"learning_rate": 1.464583659674248e-05,
|
|
"loss": 0.1666,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19265028834342957,
|
|
"step": 2835,
|
|
"valid_targets_mean": 4134.2,
|
|
"valid_targets_min": 328
|
|
},
|
|
{
|
|
"epoch": 4.403100775193798,
|
|
"grad_norm": 0.44499692816713254,
|
|
"learning_rate": 1.4571377050349347e-05,
|
|
"loss": 0.1577,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16304971277713776,
|
|
"step": 2840,
|
|
"valid_targets_mean": 4391.5,
|
|
"valid_targets_min": 370
|
|
},
|
|
{
|
|
"epoch": 4.410852713178294,
|
|
"grad_norm": 0.46432590434836263,
|
|
"learning_rate": 1.44969986440017e-05,
|
|
"loss": 0.1707,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1540422886610031,
|
|
"step": 2845,
|
|
"valid_targets_mean": 4667.3,
|
|
"valid_targets_min": 335
|
|
},
|
|
{
|
|
"epoch": 4.4186046511627906,
|
|
"grad_norm": 0.4999077483071989,
|
|
"learning_rate": 1.4422702489411894e-05,
|
|
"loss": 0.162,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18639114499092102,
|
|
"step": 2850,
|
|
"valid_targets_mean": 3962.9,
|
|
"valid_targets_min": 546
|
|
},
|
|
{
|
|
"epoch": 4.426356589147287,
|
|
"grad_norm": 0.405932784042207,
|
|
"learning_rate": 1.4348489697062925e-05,
|
|
"loss": 0.1603,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1444004476070404,
|
|
"step": 2855,
|
|
"valid_targets_mean": 4650.3,
|
|
"valid_targets_min": 1526
|
|
},
|
|
{
|
|
"epoch": 4.434108527131783,
|
|
"grad_norm": 0.3934528365825335,
|
|
"learning_rate": 1.4274361376191767e-05,
|
|
"loss": 0.1516,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1553172767162323,
|
|
"step": 2860,
|
|
"valid_targets_mean": 5694.0,
|
|
"valid_targets_min": 2890
|
|
},
|
|
{
|
|
"epoch": 4.441860465116279,
|
|
"grad_norm": 0.40913794771831696,
|
|
"learning_rate": 1.420031863477283e-05,
|
|
"loss": 0.1581,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1494569182395935,
|
|
"step": 2865,
|
|
"valid_targets_mean": 4331.6,
|
|
"valid_targets_min": 319
|
|
},
|
|
{
|
|
"epoch": 4.449612403100775,
|
|
"grad_norm": 0.47285700783628626,
|
|
"learning_rate": 1.4126362579501401e-05,
|
|
"loss": 0.1612,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15232403576374054,
|
|
"step": 2870,
|
|
"valid_targets_mean": 3542.6,
|
|
"valid_targets_min": 370
|
|
},
|
|
{
|
|
"epoch": 4.457364341085271,
|
|
"grad_norm": 0.4650848027329248,
|
|
"learning_rate": 1.4052494315777091e-05,
|
|
"loss": 0.1726,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1610431671142578,
|
|
"step": 2875,
|
|
"valid_targets_mean": 3635.2,
|
|
"valid_targets_min": 1079
|
|
},
|
|
{
|
|
"epoch": 4.465116279069767,
|
|
"grad_norm": 0.4653775809202961,
|
|
"learning_rate": 1.3978714947687308e-05,
|
|
"loss": 0.158,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20595189929008484,
|
|
"step": 2880,
|
|
"valid_targets_mean": 4235.9,
|
|
"valid_targets_min": 453
|
|
},
|
|
{
|
|
"epoch": 4.4728682170542635,
|
|
"grad_norm": 0.3856889005381559,
|
|
"learning_rate": 1.390502557799077e-05,
|
|
"loss": 0.1645,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14087346196174622,
|
|
"step": 2885,
|
|
"valid_targets_mean": 4527.4,
|
|
"valid_targets_min": 2189
|
|
},
|
|
{
|
|
"epoch": 4.48062015503876,
|
|
"grad_norm": 0.3945151120253326,
|
|
"learning_rate": 1.3831427308101021e-05,
|
|
"loss": 0.1623,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1581602394580841,
|
|
"step": 2890,
|
|
"valid_targets_mean": 4957.9,
|
|
"valid_targets_min": 1819
|
|
},
|
|
{
|
|
"epoch": 4.488372093023256,
|
|
"grad_norm": 0.40342280135663167,
|
|
"learning_rate": 1.375792123806996e-05,
|
|
"loss": 0.1669,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14058300852775574,
|
|
"step": 2895,
|
|
"valid_targets_mean": 4725.2,
|
|
"valid_targets_min": 643
|
|
},
|
|
{
|
|
"epoch": 4.496124031007752,
|
|
"grad_norm": 0.4036139924740885,
|
|
"learning_rate": 1.3684508466571385e-05,
|
|
"loss": 0.1639,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18375971913337708,
|
|
"step": 2900,
|
|
"valid_targets_mean": 5136.7,
|
|
"valid_targets_min": 536
|
|
},
|
|
{
|
|
"epoch": 4.503875968992248,
|
|
"grad_norm": 0.5271710172062103,
|
|
"learning_rate": 1.3611190090884611e-05,
|
|
"loss": 0.1606,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17250756919384003,
|
|
"step": 2905,
|
|
"valid_targets_mean": 3673.4,
|
|
"valid_targets_min": 249
|
|
},
|
|
{
|
|
"epoch": 4.511627906976744,
|
|
"grad_norm": 0.40659265968531066,
|
|
"learning_rate": 1.3537967206878036e-05,
|
|
"loss": 0.1541,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15408380329608917,
|
|
"step": 2910,
|
|
"valid_targets_mean": 4791.4,
|
|
"valid_targets_min": 869
|
|
},
|
|
{
|
|
"epoch": 4.51937984496124,
|
|
"grad_norm": 0.3722111335904797,
|
|
"learning_rate": 1.3464840908992768e-05,
|
|
"loss": 0.1553,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12856316566467285,
|
|
"step": 2915,
|
|
"valid_targets_mean": 4795.7,
|
|
"valid_targets_min": 2420
|
|
},
|
|
{
|
|
"epoch": 4.5271317829457365,
|
|
"grad_norm": 0.4556137521413307,
|
|
"learning_rate": 1.3391812290226272e-05,
|
|
"loss": 0.187,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2201414704322815,
|
|
"step": 2920,
|
|
"valid_targets_mean": 4536.7,
|
|
"valid_targets_min": 694
|
|
},
|
|
{
|
|
"epoch": 4.534883720930233,
|
|
"grad_norm": 0.4743449244975186,
|
|
"learning_rate": 1.3318882442116048e-05,
|
|
"loss": 0.1578,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21773910522460938,
|
|
"step": 2925,
|
|
"valid_targets_mean": 4512.2,
|
|
"valid_targets_min": 581
|
|
},
|
|
{
|
|
"epoch": 4.542635658914729,
|
|
"grad_norm": 0.47202078789113744,
|
|
"learning_rate": 1.3246052454723275e-05,
|
|
"loss": 0.1484,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17931053042411804,
|
|
"step": 2930,
|
|
"valid_targets_mean": 4000.9,
|
|
"valid_targets_min": 683
|
|
},
|
|
{
|
|
"epoch": 4.550387596899225,
|
|
"grad_norm": 0.363075525223068,
|
|
"learning_rate": 1.3173323416616546e-05,
|
|
"loss": 0.1634,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1436081826686859,
|
|
"step": 2935,
|
|
"valid_targets_mean": 5052.1,
|
|
"valid_targets_min": 766
|
|
},
|
|
{
|
|
"epoch": 4.558139534883721,
|
|
"grad_norm": 0.4252120402864096,
|
|
"learning_rate": 1.310069641485562e-05,
|
|
"loss": 0.163,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1449616551399231,
|
|
"step": 2940,
|
|
"valid_targets_mean": 5067.6,
|
|
"valid_targets_min": 968
|
|
},
|
|
{
|
|
"epoch": 4.565891472868217,
|
|
"grad_norm": 0.41309349051810224,
|
|
"learning_rate": 1.3028172534975125e-05,
|
|
"loss": 0.1589,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15337392687797546,
|
|
"step": 2945,
|
|
"valid_targets_mean": 4410.0,
|
|
"valid_targets_min": 625
|
|
},
|
|
{
|
|
"epoch": 4.573643410852713,
|
|
"grad_norm": 0.5160731043484095,
|
|
"learning_rate": 1.2955752860968356e-05,
|
|
"loss": 0.1697,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1839904487133026,
|
|
"step": 2950,
|
|
"valid_targets_mean": 4195.2,
|
|
"valid_targets_min": 1004
|
|
},
|
|
{
|
|
"epoch": 4.5813953488372094,
|
|
"grad_norm": 0.39603413769839324,
|
|
"learning_rate": 1.2883438475271088e-05,
|
|
"loss": 0.1449,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1449984461069107,
|
|
"step": 2955,
|
|
"valid_targets_mean": 4908.1,
|
|
"valid_targets_min": 1489
|
|
},
|
|
{
|
|
"epoch": 4.589147286821706,
|
|
"grad_norm": 0.4659985680055713,
|
|
"learning_rate": 1.2811230458745372e-05,
|
|
"loss": 0.1748,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21567106246948242,
|
|
"step": 2960,
|
|
"valid_targets_mean": 4454.5,
|
|
"valid_targets_min": 665
|
|
},
|
|
{
|
|
"epoch": 4.596899224806202,
|
|
"grad_norm": 0.4523280898732182,
|
|
"learning_rate": 1.2739129890663386e-05,
|
|
"loss": 0.1546,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15529918670654297,
|
|
"step": 2965,
|
|
"valid_targets_mean": 4419.5,
|
|
"valid_targets_min": 962
|
|
},
|
|
{
|
|
"epoch": 4.604651162790698,
|
|
"grad_norm": 0.3913593277889339,
|
|
"learning_rate": 1.266713784869131e-05,
|
|
"loss": 0.1801,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15807433426380157,
|
|
"step": 2970,
|
|
"valid_targets_mean": 4846.1,
|
|
"valid_targets_min": 734
|
|
},
|
|
{
|
|
"epoch": 4.612403100775194,
|
|
"grad_norm": 0.4182683219376584,
|
|
"learning_rate": 1.2595255408873232e-05,
|
|
"loss": 0.1507,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13988031446933746,
|
|
"step": 2975,
|
|
"valid_targets_mean": 4320.1,
|
|
"valid_targets_min": 523
|
|
},
|
|
{
|
|
"epoch": 4.62015503875969,
|
|
"grad_norm": 0.35362147101841246,
|
|
"learning_rate": 1.2523483645615031e-05,
|
|
"loss": 0.1435,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11566026508808136,
|
|
"step": 2980,
|
|
"valid_targets_mean": 5738.1,
|
|
"valid_targets_min": 1805
|
|
},
|
|
{
|
|
"epoch": 4.627906976744186,
|
|
"grad_norm": 0.4359085932620926,
|
|
"learning_rate": 1.2451823631668333e-05,
|
|
"loss": 0.1734,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2180645763874054,
|
|
"step": 2985,
|
|
"valid_targets_mean": 5415.4,
|
|
"valid_targets_min": 1779
|
|
},
|
|
{
|
|
"epoch": 4.635658914728682,
|
|
"grad_norm": 0.4178432880182616,
|
|
"learning_rate": 1.2380276438114495e-05,
|
|
"loss": 0.1635,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15357699990272522,
|
|
"step": 2990,
|
|
"valid_targets_mean": 3995.6,
|
|
"valid_targets_min": 921
|
|
},
|
|
{
|
|
"epoch": 4.6434108527131785,
|
|
"grad_norm": 0.3928742323402058,
|
|
"learning_rate": 1.2308843134348569e-05,
|
|
"loss": 0.1587,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14658121764659882,
|
|
"step": 2995,
|
|
"valid_targets_mean": 4797.7,
|
|
"valid_targets_min": 808
|
|
},
|
|
{
|
|
"epoch": 4.651162790697675,
|
|
"grad_norm": 0.40724671685704517,
|
|
"learning_rate": 1.2237524788063335e-05,
|
|
"loss": 0.1494,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13327175378799438,
|
|
"step": 3000,
|
|
"valid_targets_mean": 4289.8,
|
|
"valid_targets_min": 654
|
|
},
|
|
{
|
|
"epoch": 4.658914728682171,
|
|
"grad_norm": 0.38017870244977436,
|
|
"learning_rate": 1.2166322465233325e-05,
|
|
"loss": 0.1552,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15827676653862,
|
|
"step": 3005,
|
|
"valid_targets_mean": 5934.4,
|
|
"valid_targets_min": 2154
|
|
},
|
|
{
|
|
"epoch": 4.666666666666667,
|
|
"grad_norm": 0.4241213390458187,
|
|
"learning_rate": 1.2095237230098925e-05,
|
|
"loss": 0.1513,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15015850961208344,
|
|
"step": 3010,
|
|
"valid_targets_mean": 3942.2,
|
|
"valid_targets_min": 2726
|
|
},
|
|
{
|
|
"epoch": 4.674418604651163,
|
|
"grad_norm": 0.42983747059070593,
|
|
"learning_rate": 1.2024270145150428e-05,
|
|
"loss": 0.1529,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1613459587097168,
|
|
"step": 3015,
|
|
"valid_targets_mean": 4662.0,
|
|
"valid_targets_min": 2112
|
|
},
|
|
{
|
|
"epoch": 4.682170542635659,
|
|
"grad_norm": 0.4541648568256799,
|
|
"learning_rate": 1.1953422271112171e-05,
|
|
"loss": 0.1533,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1784931868314743,
|
|
"step": 3020,
|
|
"valid_targets_mean": 4353.8,
|
|
"valid_targets_min": 682
|
|
},
|
|
{
|
|
"epoch": 4.689922480620155,
|
|
"grad_norm": 0.37376376389283156,
|
|
"learning_rate": 1.1882694666926691e-05,
|
|
"loss": 0.1458,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10884034633636475,
|
|
"step": 3025,
|
|
"valid_targets_mean": 4409.1,
|
|
"valid_targets_min": 533
|
|
},
|
|
{
|
|
"epoch": 4.6976744186046515,
|
|
"grad_norm": 0.4214595584685805,
|
|
"learning_rate": 1.1812088389738875e-05,
|
|
"loss": 0.1558,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21922525763511658,
|
|
"step": 3030,
|
|
"valid_targets_mean": 6067.9,
|
|
"valid_targets_min": 797
|
|
},
|
|
{
|
|
"epoch": 4.705426356589148,
|
|
"grad_norm": 0.35642720118665594,
|
|
"learning_rate": 1.1741604494880177e-05,
|
|
"loss": 0.151,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14536528289318085,
|
|
"step": 3035,
|
|
"valid_targets_mean": 5993.4,
|
|
"valid_targets_min": 752
|
|
},
|
|
{
|
|
"epoch": 4.713178294573644,
|
|
"grad_norm": 0.4788498710665514,
|
|
"learning_rate": 1.167124403585283e-05,
|
|
"loss": 0.1607,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16465994715690613,
|
|
"step": 3040,
|
|
"valid_targets_mean": 3857.6,
|
|
"valid_targets_min": 302
|
|
},
|
|
{
|
|
"epoch": 4.720930232558139,
|
|
"grad_norm": 0.46807401286424594,
|
|
"learning_rate": 1.1601008064314127e-05,
|
|
"loss": 0.1511,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17980757355690002,
|
|
"step": 3045,
|
|
"valid_targets_mean": 4050.8,
|
|
"valid_targets_min": 411
|
|
},
|
|
{
|
|
"epoch": 4.728682170542635,
|
|
"grad_norm": 0.3493024998293867,
|
|
"learning_rate": 1.1530897630060664e-05,
|
|
"loss": 0.1453,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14402084052562714,
|
|
"step": 3050,
|
|
"valid_targets_mean": 5970.5,
|
|
"valid_targets_min": 3312
|
|
},
|
|
{
|
|
"epoch": 4.736434108527131,
|
|
"grad_norm": 1.1433311286570027,
|
|
"learning_rate": 1.146091378101267e-05,
|
|
"loss": 0.1612,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18359369039535522,
|
|
"step": 3055,
|
|
"valid_targets_mean": 5394.9,
|
|
"valid_targets_min": 2047
|
|
},
|
|
{
|
|
"epoch": 4.7441860465116275,
|
|
"grad_norm": 0.3656089625075003,
|
|
"learning_rate": 1.1391057563198352e-05,
|
|
"loss": 0.1568,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15548282861709595,
|
|
"step": 3060,
|
|
"valid_targets_mean": 5395.7,
|
|
"valid_targets_min": 1999
|
|
},
|
|
{
|
|
"epoch": 4.751937984496124,
|
|
"grad_norm": 0.3682957712457608,
|
|
"learning_rate": 1.1321330020738238e-05,
|
|
"loss": 0.1513,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12282656878232956,
|
|
"step": 3065,
|
|
"valid_targets_mean": 4505.5,
|
|
"valid_targets_min": 433
|
|
},
|
|
{
|
|
"epoch": 4.75968992248062,
|
|
"grad_norm": 0.41853152057960064,
|
|
"learning_rate": 1.1251732195829581e-05,
|
|
"loss": 0.1611,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13153740763664246,
|
|
"step": 3070,
|
|
"valid_targets_mean": 4470.2,
|
|
"valid_targets_min": 2352
|
|
},
|
|
{
|
|
"epoch": 4.767441860465116,
|
|
"grad_norm": 0.38423534152358596,
|
|
"learning_rate": 1.118226512873081e-05,
|
|
"loss": 0.1537,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17503979802131653,
|
|
"step": 3075,
|
|
"valid_targets_mean": 4954.4,
|
|
"valid_targets_min": 307
|
|
},
|
|
{
|
|
"epoch": 4.775193798449612,
|
|
"grad_norm": 0.37157618329698217,
|
|
"learning_rate": 1.1112929857745924e-05,
|
|
"loss": 0.1463,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13206711411476135,
|
|
"step": 3080,
|
|
"valid_targets_mean": 5568.5,
|
|
"valid_targets_min": 2292
|
|
},
|
|
{
|
|
"epoch": 4.782945736434108,
|
|
"grad_norm": 0.509246178657668,
|
|
"learning_rate": 1.1043727419209023e-05,
|
|
"loss": 0.1653,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1961718052625656,
|
|
"step": 3085,
|
|
"valid_targets_mean": 3839.4,
|
|
"valid_targets_min": 266
|
|
},
|
|
{
|
|
"epoch": 4.790697674418604,
|
|
"grad_norm": 0.4608884016393757,
|
|
"learning_rate": 1.0974658847468775e-05,
|
|
"loss": 0.1639,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18118709325790405,
|
|
"step": 3090,
|
|
"valid_targets_mean": 4658.3,
|
|
"valid_targets_min": 609
|
|
},
|
|
{
|
|
"epoch": 4.7984496124031,
|
|
"grad_norm": 0.3407586601849243,
|
|
"learning_rate": 1.0905725174873021e-05,
|
|
"loss": 0.1508,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13145892322063446,
|
|
"step": 3095,
|
|
"valid_targets_mean": 5481.1,
|
|
"valid_targets_min": 2463
|
|
},
|
|
{
|
|
"epoch": 4.8062015503875966,
|
|
"grad_norm": 0.44372721977998414,
|
|
"learning_rate": 1.0836927431753268e-05,
|
|
"loss": 0.1535,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1747463047504425,
|
|
"step": 3100,
|
|
"valid_targets_mean": 4381.4,
|
|
"valid_targets_min": 2634
|
|
},
|
|
{
|
|
"epoch": 4.813953488372093,
|
|
"grad_norm": 0.4313480237295467,
|
|
"learning_rate": 1.0768266646409331e-05,
|
|
"loss": 0.1725,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1479579210281372,
|
|
"step": 3105,
|
|
"valid_targets_mean": 3838.2,
|
|
"valid_targets_min": 558
|
|
},
|
|
{
|
|
"epoch": 4.821705426356589,
|
|
"grad_norm": 0.40712005319072236,
|
|
"learning_rate": 1.0699743845093977e-05,
|
|
"loss": 0.1807,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16829770803451538,
|
|
"step": 3110,
|
|
"valid_targets_mean": 5049.5,
|
|
"valid_targets_min": 635
|
|
},
|
|
{
|
|
"epoch": 4.829457364341085,
|
|
"grad_norm": 0.4038620874534929,
|
|
"learning_rate": 1.0631360051997545e-05,
|
|
"loss": 0.1504,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13558568060398102,
|
|
"step": 3115,
|
|
"valid_targets_mean": 4396.6,
|
|
"valid_targets_min": 477
|
|
},
|
|
{
|
|
"epoch": 4.837209302325581,
|
|
"grad_norm": 0.46074509090856464,
|
|
"learning_rate": 1.0563116289232664e-05,
|
|
"loss": 0.1389,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13045081496238708,
|
|
"step": 3120,
|
|
"valid_targets_mean": 3530.9,
|
|
"valid_targets_min": 341
|
|
},
|
|
{
|
|
"epoch": 4.844961240310077,
|
|
"grad_norm": 0.43813490790924364,
|
|
"learning_rate": 1.0495013576818974e-05,
|
|
"loss": 0.1585,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15511000156402588,
|
|
"step": 3125,
|
|
"valid_targets_mean": 4225.4,
|
|
"valid_targets_min": 670
|
|
},
|
|
{
|
|
"epoch": 4.852713178294573,
|
|
"grad_norm": 0.4380047569329961,
|
|
"learning_rate": 1.0427052932667872e-05,
|
|
"loss": 0.1729,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19142797589302063,
|
|
"step": 3130,
|
|
"valid_targets_mean": 4649.4,
|
|
"valid_targets_min": 1866
|
|
},
|
|
{
|
|
"epoch": 4.8604651162790695,
|
|
"grad_norm": 0.3622958483592568,
|
|
"learning_rate": 1.0359235372567303e-05,
|
|
"loss": 0.1564,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16687515377998352,
|
|
"step": 3135,
|
|
"valid_targets_mean": 5099.6,
|
|
"valid_targets_min": 2400
|
|
},
|
|
{
|
|
"epoch": 4.868217054263566,
|
|
"grad_norm": 0.4538324825468118,
|
|
"learning_rate": 1.0291561910166575e-05,
|
|
"loss": 0.1508,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1640026718378067,
|
|
"step": 3140,
|
|
"valid_targets_mean": 4020.4,
|
|
"valid_targets_min": 637
|
|
},
|
|
{
|
|
"epoch": 4.875968992248062,
|
|
"grad_norm": 0.3815270313643839,
|
|
"learning_rate": 1.0224033556961221e-05,
|
|
"loss": 0.1517,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15679693222045898,
|
|
"step": 3145,
|
|
"valid_targets_mean": 5416.8,
|
|
"valid_targets_min": 2731
|
|
},
|
|
{
|
|
"epoch": 4.883720930232558,
|
|
"grad_norm": 0.37173879163162826,
|
|
"learning_rate": 1.0156651322277859e-05,
|
|
"loss": 0.1545,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15583065152168274,
|
|
"step": 3150,
|
|
"valid_targets_mean": 6000.7,
|
|
"valid_targets_min": 2168
|
|
},
|
|
{
|
|
"epoch": 4.891472868217054,
|
|
"grad_norm": 0.44542528707551793,
|
|
"learning_rate": 1.0089416213259109e-05,
|
|
"loss": 0.1655,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2258930504322052,
|
|
"step": 3155,
|
|
"valid_targets_mean": 5374.3,
|
|
"valid_targets_min": 1335
|
|
},
|
|
{
|
|
"epoch": 4.89922480620155,
|
|
"grad_norm": 0.46872132575511044,
|
|
"learning_rate": 1.0022329234848568e-05,
|
|
"loss": 0.1745,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20413146913051605,
|
|
"step": 3160,
|
|
"valid_targets_mean": 4518.1,
|
|
"valid_targets_min": 1923
|
|
},
|
|
{
|
|
"epoch": 4.906976744186046,
|
|
"grad_norm": 0.4064894961029224,
|
|
"learning_rate": 9.95539138977575e-06,
|
|
"loss": 0.1493,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12033580243587494,
|
|
"step": 3165,
|
|
"valid_targets_mean": 4383.8,
|
|
"valid_targets_min": 606
|
|
},
|
|
{
|
|
"epoch": 4.9147286821705425,
|
|
"grad_norm": 0.3163430136720968,
|
|
"learning_rate": 9.88860367854112e-06,
|
|
"loss": 0.1449,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14553579688072205,
|
|
"step": 3170,
|
|
"valid_targets_mean": 7166.2,
|
|
"valid_targets_min": 3325
|
|
},
|
|
{
|
|
"epoch": 4.922480620155039,
|
|
"grad_norm": 0.38091013274436497,
|
|
"learning_rate": 9.821967099401137e-06,
|
|
"loss": 0.1657,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1597091257572174,
|
|
"step": 3175,
|
|
"valid_targets_mean": 5441.1,
|
|
"valid_targets_min": 1887
|
|
},
|
|
{
|
|
"epoch": 4.930232558139535,
|
|
"grad_norm": 0.34441694300189507,
|
|
"learning_rate": 9.755482648353335e-06,
|
|
"loss": 0.1646,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13708937168121338,
|
|
"step": 3180,
|
|
"valid_targets_mean": 5538.1,
|
|
"valid_targets_min": 2859
|
|
},
|
|
{
|
|
"epoch": 4.937984496124031,
|
|
"grad_norm": 0.37415077897828763,
|
|
"learning_rate": 9.689151319121433e-06,
|
|
"loss": 0.1629,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14037328958511353,
|
|
"step": 3185,
|
|
"valid_targets_mean": 5194.1,
|
|
"valid_targets_min": 2266
|
|
},
|
|
{
|
|
"epoch": 4.945736434108527,
|
|
"grad_norm": 0.44777782502419616,
|
|
"learning_rate": 9.62297410314047e-06,
|
|
"loss": 0.1678,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18096795678138733,
|
|
"step": 3190,
|
|
"valid_targets_mean": 4345.2,
|
|
"valid_targets_min": 750
|
|
},
|
|
{
|
|
"epoch": 4.953488372093023,
|
|
"grad_norm": 0.38931181856536856,
|
|
"learning_rate": 9.556951989542032e-06,
|
|
"loss": 0.1541,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11744767427444458,
|
|
"step": 3195,
|
|
"valid_targets_mean": 4002.5,
|
|
"valid_targets_min": 462
|
|
},
|
|
{
|
|
"epoch": 4.961240310077519,
|
|
"grad_norm": 0.36948872010681133,
|
|
"learning_rate": 9.491085965139402e-06,
|
|
"loss": 0.1516,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12257242947816849,
|
|
"step": 3200,
|
|
"valid_targets_mean": 5256.6,
|
|
"valid_targets_min": 611
|
|
},
|
|
{
|
|
"epoch": 4.9689922480620154,
|
|
"grad_norm": 0.41347264041909937,
|
|
"learning_rate": 9.425377014412848e-06,
|
|
"loss": 0.1556,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15283584594726562,
|
|
"step": 3205,
|
|
"valid_targets_mean": 4368.1,
|
|
"valid_targets_min": 891
|
|
},
|
|
{
|
|
"epoch": 4.976744186046512,
|
|
"grad_norm": 0.42750383797473995,
|
|
"learning_rate": 9.35982611949493e-06,
|
|
"loss": 0.1725,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18603989481925964,
|
|
"step": 3210,
|
|
"valid_targets_mean": 4814.5,
|
|
"valid_targets_min": 483
|
|
},
|
|
{
|
|
"epoch": 4.984496124031008,
|
|
"grad_norm": 0.43059647799726375,
|
|
"learning_rate": 9.294434260155765e-06,
|
|
"loss": 0.161,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22478413581848145,
|
|
"step": 3215,
|
|
"valid_targets_mean": 5452.1,
|
|
"valid_targets_min": 1531
|
|
},
|
|
{
|
|
"epoch": 4.992248062015504,
|
|
"grad_norm": 0.39768354831373554,
|
|
"learning_rate": 9.229202413788419e-06,
|
|
"loss": 0.1745,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15155833959579468,
|
|
"step": 3220,
|
|
"valid_targets_mean": 4607.6,
|
|
"valid_targets_min": 2135
|
|
},
|
|
{
|
|
"epoch": 5.0,
|
|
"grad_norm": 0.38185972751001357,
|
|
"learning_rate": 9.164131555394288e-06,
|
|
"loss": 0.1561,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13077522814273834,
|
|
"step": 3225,
|
|
"valid_targets_mean": 4259.6,
|
|
"valid_targets_min": 380
|
|
},
|
|
{
|
|
"epoch": 5.007751937984496,
|
|
"grad_norm": 0.41906475146843863,
|
|
"learning_rate": 9.099222657568554e-06,
|
|
"loss": 0.1557,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15627771615982056,
|
|
"step": 3230,
|
|
"valid_targets_mean": 5040.4,
|
|
"valid_targets_min": 1940
|
|
},
|
|
{
|
|
"epoch": 5.015503875968992,
|
|
"grad_norm": 0.4052151818524859,
|
|
"learning_rate": 9.034476690485579e-06,
|
|
"loss": 0.1328,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13936452567577362,
|
|
"step": 3235,
|
|
"valid_targets_mean": 5023.8,
|
|
"valid_targets_min": 705
|
|
},
|
|
{
|
|
"epoch": 5.023255813953488,
|
|
"grad_norm": 0.37188613632576223,
|
|
"learning_rate": 8.969894621884467e-06,
|
|
"loss": 0.1426,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12986522912979126,
|
|
"step": 3240,
|
|
"valid_targets_mean": 5463.1,
|
|
"valid_targets_min": 412
|
|
},
|
|
{
|
|
"epoch": 5.0310077519379846,
|
|
"grad_norm": 0.3919445371842698,
|
|
"learning_rate": 8.905477417054595e-06,
|
|
"loss": 0.1387,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12915056943893433,
|
|
"step": 3245,
|
|
"valid_targets_mean": 5352.3,
|
|
"valid_targets_min": 2354
|
|
},
|
|
{
|
|
"epoch": 5.038759689922481,
|
|
"grad_norm": 0.40240515277621475,
|
|
"learning_rate": 8.841226038821147e-06,
|
|
"loss": 0.1414,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1427655816078186,
|
|
"step": 3250,
|
|
"valid_targets_mean": 4806.9,
|
|
"valid_targets_min": 927
|
|
},
|
|
{
|
|
"epoch": 5.046511627906977,
|
|
"grad_norm": 0.4482311614474207,
|
|
"learning_rate": 8.77714144753075e-06,
|
|
"loss": 0.1335,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1503133922815323,
|
|
"step": 3255,
|
|
"valid_targets_mean": 4343.8,
|
|
"valid_targets_min": 188
|
|
},
|
|
{
|
|
"epoch": 5.054263565891473,
|
|
"grad_norm": 0.41632602975114186,
|
|
"learning_rate": 8.713224601037116e-06,
|
|
"loss": 0.1424,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11666247993707657,
|
|
"step": 3260,
|
|
"valid_targets_mean": 3756.2,
|
|
"valid_targets_min": 412
|
|
},
|
|
{
|
|
"epoch": 5.062015503875969,
|
|
"grad_norm": 0.4421325070582108,
|
|
"learning_rate": 8.649476454686734e-06,
|
|
"loss": 0.1549,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14591653645038605,
|
|
"step": 3265,
|
|
"valid_targets_mean": 4298.9,
|
|
"valid_targets_min": 2252
|
|
},
|
|
{
|
|
"epoch": 5.069767441860465,
|
|
"grad_norm": 0.3706889070551245,
|
|
"learning_rate": 8.58589796130457e-06,
|
|
"loss": 0.1448,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1363983452320099,
|
|
"step": 3270,
|
|
"valid_targets_mean": 5321.2,
|
|
"valid_targets_min": 435
|
|
},
|
|
{
|
|
"epoch": 5.077519379844961,
|
|
"grad_norm": 0.42292771021367553,
|
|
"learning_rate": 8.522490071179834e-06,
|
|
"loss": 0.1654,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1678886115550995,
|
|
"step": 3275,
|
|
"valid_targets_mean": 4751.9,
|
|
"valid_targets_min": 610
|
|
},
|
|
{
|
|
"epoch": 5.0852713178294575,
|
|
"grad_norm": 0.5828499776845351,
|
|
"learning_rate": 8.459253732051793e-06,
|
|
"loss": 0.1661,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17978990077972412,
|
|
"step": 3280,
|
|
"valid_targets_mean": 4170.8,
|
|
"valid_targets_min": 267
|
|
},
|
|
{
|
|
"epoch": 5.093023255813954,
|
|
"grad_norm": 0.4615372722971231,
|
|
"learning_rate": 8.396189889095581e-06,
|
|
"loss": 0.1516,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18241898715496063,
|
|
"step": 3285,
|
|
"valid_targets_mean": 4325.0,
|
|
"valid_targets_min": 1860
|
|
},
|
|
{
|
|
"epoch": 5.10077519379845,
|
|
"grad_norm": 0.3817650649549942,
|
|
"learning_rate": 8.333299484908081e-06,
|
|
"loss": 0.1368,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1241084486246109,
|
|
"step": 3290,
|
|
"valid_targets_mean": 4798.9,
|
|
"valid_targets_min": 670
|
|
},
|
|
{
|
|
"epoch": 5.108527131782946,
|
|
"grad_norm": 0.4194147503687341,
|
|
"learning_rate": 8.27058345949384e-06,
|
|
"loss": 0.1484,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14202088117599487,
|
|
"step": 3295,
|
|
"valid_targets_mean": 4392.2,
|
|
"valid_targets_min": 1724
|
|
},
|
|
{
|
|
"epoch": 5.116279069767442,
|
|
"grad_norm": 0.38881934176704125,
|
|
"learning_rate": 8.208042750251017e-06,
|
|
"loss": 0.1428,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12283352017402649,
|
|
"step": 3300,
|
|
"valid_targets_mean": 5001.8,
|
|
"valid_targets_min": 860
|
|
},
|
|
{
|
|
"epoch": 5.124031007751938,
|
|
"grad_norm": 0.41598556767284195,
|
|
"learning_rate": 8.14567829195737e-06,
|
|
"loss": 0.1498,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12442460656166077,
|
|
"step": 3305,
|
|
"valid_targets_mean": 4178.7,
|
|
"valid_targets_min": 1866
|
|
},
|
|
{
|
|
"epoch": 5.131782945736434,
|
|
"grad_norm": 0.5128407487191675,
|
|
"learning_rate": 8.083491016756282e-06,
|
|
"loss": 0.1501,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17859122157096863,
|
|
"step": 3310,
|
|
"valid_targets_mean": 3686.2,
|
|
"valid_targets_min": 761
|
|
},
|
|
{
|
|
"epoch": 5.1395348837209305,
|
|
"grad_norm": 0.3758183019008081,
|
|
"learning_rate": 8.021481854142843e-06,
|
|
"loss": 0.1487,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14447617530822754,
|
|
"step": 3315,
|
|
"valid_targets_mean": 5073.4,
|
|
"valid_targets_min": 1295
|
|
},
|
|
{
|
|
"epoch": 5.147286821705427,
|
|
"grad_norm": 0.47801726631549907,
|
|
"learning_rate": 7.959651730949938e-06,
|
|
"loss": 0.14,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1533583104610443,
|
|
"step": 3320,
|
|
"valid_targets_mean": 3810.4,
|
|
"valid_targets_min": 688
|
|
},
|
|
{
|
|
"epoch": 5.155038759689923,
|
|
"grad_norm": 0.3860929841594393,
|
|
"learning_rate": 7.898001571334393e-06,
|
|
"loss": 0.148,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14451035857200623,
|
|
"step": 3325,
|
|
"valid_targets_mean": 5514.4,
|
|
"valid_targets_min": 587
|
|
},
|
|
{
|
|
"epoch": 5.162790697674419,
|
|
"grad_norm": 0.3927336266773621,
|
|
"learning_rate": 7.836532296763195e-06,
|
|
"loss": 0.15,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14219003915786743,
|
|
"step": 3330,
|
|
"valid_targets_mean": 5720.4,
|
|
"valid_targets_min": 854
|
|
},
|
|
{
|
|
"epoch": 5.170542635658915,
|
|
"grad_norm": 0.4701871029698711,
|
|
"learning_rate": 7.775244825999674e-06,
|
|
"loss": 0.1506,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13866694271564484,
|
|
"step": 3335,
|
|
"valid_targets_mean": 4240.4,
|
|
"valid_targets_min": 327
|
|
},
|
|
{
|
|
"epoch": 5.178294573643411,
|
|
"grad_norm": 0.5611394213445632,
|
|
"learning_rate": 7.7141400750898e-06,
|
|
"loss": 0.1537,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1594468057155609,
|
|
"step": 3340,
|
|
"valid_targets_mean": 3598.9,
|
|
"valid_targets_min": 332
|
|
},
|
|
{
|
|
"epoch": 5.186046511627907,
|
|
"grad_norm": 0.46697871764537624,
|
|
"learning_rate": 7.653218957348478e-06,
|
|
"loss": 0.1625,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17361919581890106,
|
|
"step": 3345,
|
|
"valid_targets_mean": 4588.7,
|
|
"valid_targets_min": 750
|
|
},
|
|
{
|
|
"epoch": 5.1937984496124034,
|
|
"grad_norm": 0.40704733172155627,
|
|
"learning_rate": 7.592482383345905e-06,
|
|
"loss": 0.1715,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16594815254211426,
|
|
"step": 3350,
|
|
"valid_targets_mean": 5162.1,
|
|
"valid_targets_min": 2503
|
|
},
|
|
{
|
|
"epoch": 5.2015503875969,
|
|
"grad_norm": 0.43347382037931187,
|
|
"learning_rate": 7.531931260893956e-06,
|
|
"loss": 0.1481,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12546521425247192,
|
|
"step": 3355,
|
|
"valid_targets_mean": 4259.8,
|
|
"valid_targets_min": 2493
|
|
},
|
|
{
|
|
"epoch": 5.209302325581396,
|
|
"grad_norm": 0.451832191981657,
|
|
"learning_rate": 7.47156649503261e-06,
|
|
"loss": 0.1444,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14870810508728027,
|
|
"step": 3360,
|
|
"valid_targets_mean": 4736.9,
|
|
"valid_targets_min": 2527
|
|
},
|
|
{
|
|
"epoch": 5.217054263565892,
|
|
"grad_norm": 0.5092134368319543,
|
|
"learning_rate": 7.411388988016444e-06,
|
|
"loss": 0.1464,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18897545337677002,
|
|
"step": 3365,
|
|
"valid_targets_mean": 4291.3,
|
|
"valid_targets_min": 1979
|
|
},
|
|
{
|
|
"epoch": 5.224806201550388,
|
|
"grad_norm": 0.3992712621608886,
|
|
"learning_rate": 7.351399639301116e-06,
|
|
"loss": 0.1433,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16864998638629913,
|
|
"step": 3370,
|
|
"valid_targets_mean": 5468.9,
|
|
"valid_targets_min": 2411
|
|
},
|
|
{
|
|
"epoch": 5.232558139534884,
|
|
"grad_norm": 0.43818725229100414,
|
|
"learning_rate": 7.291599345529936e-06,
|
|
"loss": 0.1517,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14088185131549835,
|
|
"step": 3375,
|
|
"valid_targets_mean": 4397.0,
|
|
"valid_targets_min": 227
|
|
},
|
|
{
|
|
"epoch": 5.24031007751938,
|
|
"grad_norm": 0.42669853677221803,
|
|
"learning_rate": 7.231989000520485e-06,
|
|
"loss": 0.1637,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16974776983261108,
|
|
"step": 3380,
|
|
"valid_targets_mean": 5304.2,
|
|
"valid_targets_min": 818
|
|
},
|
|
{
|
|
"epoch": 5.248062015503876,
|
|
"grad_norm": 0.42231966887434225,
|
|
"learning_rate": 7.172569495251214e-06,
|
|
"loss": 0.1525,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15044859051704407,
|
|
"step": 3385,
|
|
"valid_targets_mean": 4793.6,
|
|
"valid_targets_min": 893
|
|
},
|
|
{
|
|
"epoch": 5.2558139534883725,
|
|
"grad_norm": 0.3774758090043144,
|
|
"learning_rate": 7.113341717848154e-06,
|
|
"loss": 0.1478,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14274142682552338,
|
|
"step": 3390,
|
|
"valid_targets_mean": 5430.0,
|
|
"valid_targets_min": 567
|
|
},
|
|
{
|
|
"epoch": 5.263565891472869,
|
|
"grad_norm": 0.4221322079184396,
|
|
"learning_rate": 7.05430655357163e-06,
|
|
"loss": 0.1356,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1326403170824051,
|
|
"step": 3395,
|
|
"valid_targets_mean": 4851.8,
|
|
"valid_targets_min": 1855
|
|
},
|
|
{
|
|
"epoch": 5.271317829457364,
|
|
"grad_norm": 0.41865340457663663,
|
|
"learning_rate": 6.995464884803056e-06,
|
|
"loss": 0.1605,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15016970038414001,
|
|
"step": 3400,
|
|
"valid_targets_mean": 4839.2,
|
|
"valid_targets_min": 685
|
|
},
|
|
{
|
|
"epoch": 5.27906976744186,
|
|
"grad_norm": 0.37620910591252854,
|
|
"learning_rate": 6.936817591031704e-06,
|
|
"loss": 0.1553,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11961726099252701,
|
|
"step": 3405,
|
|
"valid_targets_mean": 5236.1,
|
|
"valid_targets_min": 263
|
|
},
|
|
{
|
|
"epoch": 5.286821705426356,
|
|
"grad_norm": 0.41396399132639294,
|
|
"learning_rate": 6.878365548841583e-06,
|
|
"loss": 0.1667,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15676863491535187,
|
|
"step": 3410,
|
|
"valid_targets_mean": 5105.6,
|
|
"valid_targets_min": 434
|
|
},
|
|
{
|
|
"epoch": 5.294573643410852,
|
|
"grad_norm": 0.37430857448740984,
|
|
"learning_rate": 6.820109631898337e-06,
|
|
"loss": 0.1537,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13516280055046082,
|
|
"step": 3415,
|
|
"valid_targets_mean": 5407.8,
|
|
"valid_targets_min": 361
|
|
},
|
|
{
|
|
"epoch": 5.3023255813953485,
|
|
"grad_norm": 0.39609033417068207,
|
|
"learning_rate": 6.7620507109361876e-06,
|
|
"loss": 0.1416,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11794918775558472,
|
|
"step": 3420,
|
|
"valid_targets_mean": 4567.0,
|
|
"valid_targets_min": 770
|
|
},
|
|
{
|
|
"epoch": 5.310077519379845,
|
|
"grad_norm": 0.6118599264333754,
|
|
"learning_rate": 6.704189653744897e-06,
|
|
"loss": 0.1615,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1839725375175476,
|
|
"step": 3425,
|
|
"valid_targets_mean": 4516.2,
|
|
"valid_targets_min": 484
|
|
},
|
|
{
|
|
"epoch": 5.317829457364341,
|
|
"grad_norm": 0.4381562079932628,
|
|
"learning_rate": 6.646527325156842e-06,
|
|
"loss": 0.1412,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16818967461585999,
|
|
"step": 3430,
|
|
"valid_targets_mean": 4886.8,
|
|
"valid_targets_min": 420
|
|
},
|
|
{
|
|
"epoch": 5.325581395348837,
|
|
"grad_norm": 0.4226204361999147,
|
|
"learning_rate": 6.5890645870340445e-06,
|
|
"loss": 0.1548,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1639600247144699,
|
|
"step": 3435,
|
|
"valid_targets_mean": 5103.1,
|
|
"valid_targets_min": 696
|
|
},
|
|
{
|
|
"epoch": 5.333333333333333,
|
|
"grad_norm": 0.3710849263141366,
|
|
"learning_rate": 6.531802298255303e-06,
|
|
"loss": 0.1499,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12949195504188538,
|
|
"step": 3440,
|
|
"valid_targets_mean": 4989.1,
|
|
"valid_targets_min": 2837
|
|
},
|
|
{
|
|
"epoch": 5.341085271317829,
|
|
"grad_norm": 0.4435129156035455,
|
|
"learning_rate": 6.474741314703359e-06,
|
|
"loss": 0.1478,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15639318525791168,
|
|
"step": 3445,
|
|
"valid_targets_mean": 4721.8,
|
|
"valid_targets_min": 617
|
|
},
|
|
{
|
|
"epoch": 5.348837209302325,
|
|
"grad_norm": 0.3625818524554749,
|
|
"learning_rate": 6.417882489252123e-06,
|
|
"loss": 0.1402,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12721361219882965,
|
|
"step": 3450,
|
|
"valid_targets_mean": 5639.6,
|
|
"valid_targets_min": 3016
|
|
},
|
|
{
|
|
"epoch": 5.3565891472868215,
|
|
"grad_norm": 0.4323434478569545,
|
|
"learning_rate": 6.361226671753881e-06,
|
|
"loss": 0.1493,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1502252072095871,
|
|
"step": 3455,
|
|
"valid_targets_mean": 5072.4,
|
|
"valid_targets_min": 346
|
|
},
|
|
{
|
|
"epoch": 5.364341085271318,
|
|
"grad_norm": 0.37196863493668914,
|
|
"learning_rate": 6.304774709026633e-06,
|
|
"loss": 0.1474,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12962721288204193,
|
|
"step": 3460,
|
|
"valid_targets_mean": 5211.2,
|
|
"valid_targets_min": 2412
|
|
},
|
|
{
|
|
"epoch": 5.372093023255814,
|
|
"grad_norm": 0.4392929005011265,
|
|
"learning_rate": 6.248527444841417e-06,
|
|
"loss": 0.1469,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15446701645851135,
|
|
"step": 3465,
|
|
"valid_targets_mean": 4372.7,
|
|
"valid_targets_min": 2320
|
|
},
|
|
{
|
|
"epoch": 5.37984496124031,
|
|
"grad_norm": 0.45498046007325976,
|
|
"learning_rate": 6.1924857199097e-06,
|
|
"loss": 0.1653,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1651144027709961,
|
|
"step": 3470,
|
|
"valid_targets_mean": 4883.4,
|
|
"valid_targets_min": 936
|
|
},
|
|
{
|
|
"epoch": 5.387596899224806,
|
|
"grad_norm": 0.42317989191246896,
|
|
"learning_rate": 6.136650371870816e-06,
|
|
"loss": 0.1391,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12391775101423264,
|
|
"step": 3475,
|
|
"valid_targets_mean": 6439.6,
|
|
"valid_targets_min": 2368
|
|
},
|
|
{
|
|
"epoch": 5.395348837209302,
|
|
"grad_norm": 0.4440482712927205,
|
|
"learning_rate": 6.081022235279439e-06,
|
|
"loss": 0.1509,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13077440857887268,
|
|
"step": 3480,
|
|
"valid_targets_mean": 4186.4,
|
|
"valid_targets_min": 2293
|
|
},
|
|
{
|
|
"epoch": 5.403100775193798,
|
|
"grad_norm": 0.45472821818832726,
|
|
"learning_rate": 6.025602141593128e-06,
|
|
"loss": 0.1387,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13112467527389526,
|
|
"step": 3485,
|
|
"valid_targets_mean": 4406.1,
|
|
"valid_targets_min": 454
|
|
},
|
|
{
|
|
"epoch": 5.410852713178294,
|
|
"grad_norm": 0.3962937912503978,
|
|
"learning_rate": 5.970390919159872e-06,
|
|
"loss": 0.1493,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16544798016548157,
|
|
"step": 3490,
|
|
"valid_targets_mean": 5308.0,
|
|
"valid_targets_min": 797
|
|
},
|
|
{
|
|
"epoch": 5.4186046511627906,
|
|
"grad_norm": 0.3643941673945403,
|
|
"learning_rate": 5.915389393205717e-06,
|
|
"loss": 0.1608,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11564834415912628,
|
|
"step": 3495,
|
|
"valid_targets_mean": 4933.6,
|
|
"valid_targets_min": 573
|
|
},
|
|
{
|
|
"epoch": 5.426356589147287,
|
|
"grad_norm": 0.42998784565296494,
|
|
"learning_rate": 5.86059838582246e-06,
|
|
"loss": 0.1413,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15233772993087769,
|
|
"step": 3500,
|
|
"valid_targets_mean": 4981.4,
|
|
"valid_targets_min": 269
|
|
},
|
|
{
|
|
"epoch": 5.434108527131783,
|
|
"grad_norm": 0.41822740876158127,
|
|
"learning_rate": 5.806018715955317e-06,
|
|
"loss": 0.1449,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1299438178539276,
|
|
"step": 3505,
|
|
"valid_targets_mean": 4537.4,
|
|
"valid_targets_min": 1080
|
|
},
|
|
{
|
|
"epoch": 5.441860465116279,
|
|
"grad_norm": 0.4528399940397294,
|
|
"learning_rate": 5.751651199390704e-06,
|
|
"loss": 0.1558,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16579484939575195,
|
|
"step": 3510,
|
|
"valid_targets_mean": 4755.4,
|
|
"valid_targets_min": 2776
|
|
},
|
|
{
|
|
"epoch": 5.449612403100775,
|
|
"grad_norm": 0.4684592080080512,
|
|
"learning_rate": 5.697496648744063e-06,
|
|
"loss": 0.1353,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.143550843000412,
|
|
"step": 3515,
|
|
"valid_targets_mean": 3519.6,
|
|
"valid_targets_min": 530
|
|
},
|
|
{
|
|
"epoch": 5.457364341085271,
|
|
"grad_norm": 0.45674225562117354,
|
|
"learning_rate": 5.643555873447677e-06,
|
|
"loss": 0.1408,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14884954690933228,
|
|
"step": 3520,
|
|
"valid_targets_mean": 4183.1,
|
|
"valid_targets_min": 764
|
|
},
|
|
{
|
|
"epoch": 5.465116279069767,
|
|
"grad_norm": 0.4035257697649145,
|
|
"learning_rate": 5.589829679738597e-06,
|
|
"loss": 0.1605,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1421164870262146,
|
|
"step": 3525,
|
|
"valid_targets_mean": 5205.2,
|
|
"valid_targets_min": 2073
|
|
},
|
|
{
|
|
"epoch": 5.4728682170542635,
|
|
"grad_norm": 0.5117576530097852,
|
|
"learning_rate": 5.536318870646587e-06,
|
|
"loss": 0.145,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16778147220611572,
|
|
"step": 3530,
|
|
"valid_targets_mean": 5321.6,
|
|
"valid_targets_min": 639
|
|
},
|
|
{
|
|
"epoch": 5.48062015503876,
|
|
"grad_norm": 0.4104772923087062,
|
|
"learning_rate": 5.483024245982116e-06,
|
|
"loss": 0.1562,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13928261399269104,
|
|
"step": 3535,
|
|
"valid_targets_mean": 4891.7,
|
|
"valid_targets_min": 410
|
|
},
|
|
{
|
|
"epoch": 5.488372093023256,
|
|
"grad_norm": 0.4268402728473486,
|
|
"learning_rate": 5.429946602324414e-06,
|
|
"loss": 0.1467,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1458597481250763,
|
|
"step": 3540,
|
|
"valid_targets_mean": 4448.0,
|
|
"valid_targets_min": 277
|
|
},
|
|
{
|
|
"epoch": 5.496124031007752,
|
|
"grad_norm": 0.4715412702854216,
|
|
"learning_rate": 5.377086733009551e-06,
|
|
"loss": 0.1421,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14967858791351318,
|
|
"step": 3545,
|
|
"valid_targets_mean": 4361.0,
|
|
"valid_targets_min": 704
|
|
},
|
|
{
|
|
"epoch": 5.503875968992248,
|
|
"grad_norm": 0.5279261179055396,
|
|
"learning_rate": 5.3244454281185984e-06,
|
|
"loss": 0.1689,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20234504342079163,
|
|
"step": 3550,
|
|
"valid_targets_mean": 3873.4,
|
|
"valid_targets_min": 615
|
|
},
|
|
{
|
|
"epoch": 5.511627906976744,
|
|
"grad_norm": 0.507981142775861,
|
|
"learning_rate": 5.272023474465799e-06,
|
|
"loss": 0.1552,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1777733415365219,
|
|
"step": 3555,
|
|
"valid_targets_mean": 3797.2,
|
|
"valid_targets_min": 472
|
|
},
|
|
{
|
|
"epoch": 5.51937984496124,
|
|
"grad_norm": 0.3833421328022469,
|
|
"learning_rate": 5.219821655586821e-06,
|
|
"loss": 0.1471,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16572965681552887,
|
|
"step": 3560,
|
|
"valid_targets_mean": 5526.5,
|
|
"valid_targets_min": 551
|
|
},
|
|
{
|
|
"epoch": 5.5271317829457365,
|
|
"grad_norm": 0.43394338581146247,
|
|
"learning_rate": 5.167840751727034e-06,
|
|
"loss": 0.1497,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15046624839305878,
|
|
"step": 3565,
|
|
"valid_targets_mean": 4108.6,
|
|
"valid_targets_min": 536
|
|
},
|
|
{
|
|
"epoch": 5.534883720930233,
|
|
"grad_norm": 0.40622205843630427,
|
|
"learning_rate": 5.116081539829874e-06,
|
|
"loss": 0.1362,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16226355731487274,
|
|
"step": 3570,
|
|
"valid_targets_mean": 6044.9,
|
|
"valid_targets_min": 1779
|
|
},
|
|
{
|
|
"epoch": 5.542635658914729,
|
|
"grad_norm": 0.4029911479453827,
|
|
"learning_rate": 5.064544793525192e-06,
|
|
"loss": 0.1668,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14648669958114624,
|
|
"step": 3575,
|
|
"valid_targets_mean": 5268.5,
|
|
"valid_targets_min": 249
|
|
},
|
|
{
|
|
"epoch": 5.550387596899225,
|
|
"grad_norm": 0.5364248446568755,
|
|
"learning_rate": 5.013231283117723e-06,
|
|
"loss": 0.1486,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14924436807632446,
|
|
"step": 3580,
|
|
"valid_targets_mean": 4603.7,
|
|
"valid_targets_min": 2372
|
|
},
|
|
{
|
|
"epoch": 5.558139534883721,
|
|
"grad_norm": 0.40849395379526177,
|
|
"learning_rate": 4.962141775575553e-06,
|
|
"loss": 0.1457,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1340319961309433,
|
|
"step": 3585,
|
|
"valid_targets_mean": 4452.3,
|
|
"valid_targets_min": 2157
|
|
},
|
|
{
|
|
"epoch": 5.565891472868217,
|
|
"grad_norm": 0.3507387441886511,
|
|
"learning_rate": 4.9112770345186664e-06,
|
|
"loss": 0.1308,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10928727686405182,
|
|
"step": 3590,
|
|
"valid_targets_mean": 5409.7,
|
|
"valid_targets_min": 2109
|
|
},
|
|
{
|
|
"epoch": 5.573643410852713,
|
|
"grad_norm": 0.4457364584152074,
|
|
"learning_rate": 4.8606378202075215e-06,
|
|
"loss": 0.1421,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13773344457149506,
|
|
"step": 3595,
|
|
"valid_targets_mean": 4546.3,
|
|
"valid_targets_min": 327
|
|
},
|
|
{
|
|
"epoch": 5.5813953488372094,
|
|
"grad_norm": 0.4973298360537683,
|
|
"learning_rate": 4.81022488953171e-06,
|
|
"loss": 0.1382,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1543937474489212,
|
|
"step": 3600,
|
|
"valid_targets_mean": 4128.4,
|
|
"valid_targets_min": 349
|
|
},
|
|
{
|
|
"epoch": 5.589147286821706,
|
|
"grad_norm": 0.36859713218728013,
|
|
"learning_rate": 4.760038995998612e-06,
|
|
"loss": 0.1597,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14406907558441162,
|
|
"step": 3605,
|
|
"valid_targets_mean": 5601.7,
|
|
"valid_targets_min": 2213
|
|
},
|
|
{
|
|
"epoch": 5.596899224806202,
|
|
"grad_norm": 0.3775608828670771,
|
|
"learning_rate": 4.710080889722157e-06,
|
|
"loss": 0.1379,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11484645307064056,
|
|
"step": 3610,
|
|
"valid_targets_mean": 4418.9,
|
|
"valid_targets_min": 781
|
|
},
|
|
{
|
|
"epoch": 5.604651162790698,
|
|
"grad_norm": 0.5585581576269192,
|
|
"learning_rate": 4.660351317411598e-06,
|
|
"loss": 0.1546,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16293855011463165,
|
|
"step": 3615,
|
|
"valid_targets_mean": 3673.5,
|
|
"valid_targets_min": 853
|
|
},
|
|
{
|
|
"epoch": 5.612403100775194,
|
|
"grad_norm": 0.40317305487140387,
|
|
"learning_rate": 4.610851022360372e-06,
|
|
"loss": 0.1472,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16022725403308868,
|
|
"step": 3620,
|
|
"valid_targets_mean": 5046.8,
|
|
"valid_targets_min": 719
|
|
},
|
|
{
|
|
"epoch": 5.62015503875969,
|
|
"grad_norm": 0.46629312553258945,
|
|
"learning_rate": 4.561580744434962e-06,
|
|
"loss": 0.1363,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16484293341636658,
|
|
"step": 3625,
|
|
"valid_targets_mean": 4345.7,
|
|
"valid_targets_min": 719
|
|
},
|
|
{
|
|
"epoch": 5.627906976744186,
|
|
"grad_norm": 0.4517994866451772,
|
|
"learning_rate": 4.512541220063849e-06,
|
|
"loss": 0.1583,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1768956333398819,
|
|
"step": 3630,
|
|
"valid_targets_mean": 5144.0,
|
|
"valid_targets_min": 1570
|
|
},
|
|
{
|
|
"epoch": 5.635658914728682,
|
|
"grad_norm": 0.4266612314681182,
|
|
"learning_rate": 4.463733182226526e-06,
|
|
"loss": 0.1441,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12670007348060608,
|
|
"step": 3635,
|
|
"valid_targets_mean": 4100.2,
|
|
"valid_targets_min": 2116
|
|
},
|
|
{
|
|
"epoch": 5.6434108527131785,
|
|
"grad_norm": 0.4680346659273191,
|
|
"learning_rate": 4.415157360442517e-06,
|
|
"loss": 0.16,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17845088243484497,
|
|
"step": 3640,
|
|
"valid_targets_mean": 4356.6,
|
|
"valid_targets_min": 322
|
|
},
|
|
{
|
|
"epoch": 5.651162790697675,
|
|
"grad_norm": 0.3890028520850903,
|
|
"learning_rate": 4.366814480760461e-06,
|
|
"loss": 0.1435,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12099163234233856,
|
|
"step": 3645,
|
|
"valid_targets_mean": 5003.2,
|
|
"valid_targets_min": 2596
|
|
},
|
|
{
|
|
"epoch": 5.658914728682171,
|
|
"grad_norm": 0.5488303595169921,
|
|
"learning_rate": 4.318705265747298e-06,
|
|
"loss": 0.1572,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1828697919845581,
|
|
"step": 3650,
|
|
"valid_targets_mean": 3999.2,
|
|
"valid_targets_min": 528
|
|
},
|
|
{
|
|
"epoch": 5.666666666666667,
|
|
"grad_norm": 0.42060572333330015,
|
|
"learning_rate": 4.2708304344774554e-06,
|
|
"loss": 0.1384,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13645608723163605,
|
|
"step": 3655,
|
|
"valid_targets_mean": 4687.2,
|
|
"valid_targets_min": 2741
|
|
},
|
|
{
|
|
"epoch": 5.674418604651163,
|
|
"grad_norm": 0.4387274771557827,
|
|
"learning_rate": 4.223190702522084e-06,
|
|
"loss": 0.1453,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14829561114311218,
|
|
"step": 3660,
|
|
"valid_targets_mean": 4422.6,
|
|
"valid_targets_min": 757
|
|
},
|
|
{
|
|
"epoch": 5.682170542635659,
|
|
"grad_norm": 0.38684240070794124,
|
|
"learning_rate": 4.1757867819383695e-06,
|
|
"loss": 0.1485,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15705367922782898,
|
|
"step": 3665,
|
|
"valid_targets_mean": 5591.4,
|
|
"valid_targets_min": 2183
|
|
},
|
|
{
|
|
"epoch": 5.689922480620155,
|
|
"grad_norm": 0.3924859326932451,
|
|
"learning_rate": 4.128619381258914e-06,
|
|
"loss": 0.1559,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1718716323375702,
|
|
"step": 3670,
|
|
"valid_targets_mean": 5566.4,
|
|
"valid_targets_min": 344
|
|
},
|
|
{
|
|
"epoch": 5.6976744186046515,
|
|
"grad_norm": 0.4255325828911711,
|
|
"learning_rate": 4.081689205481103e-06,
|
|
"loss": 0.1409,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15730968117713928,
|
|
"step": 3675,
|
|
"valid_targets_mean": 4940.1,
|
|
"valid_targets_min": 2527
|
|
},
|
|
{
|
|
"epoch": 5.705426356589148,
|
|
"grad_norm": 0.4523673615926739,
|
|
"learning_rate": 4.034996956056596e-06,
|
|
"loss": 0.1613,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17630687355995178,
|
|
"step": 3680,
|
|
"valid_targets_mean": 4730.1,
|
|
"valid_targets_min": 836
|
|
},
|
|
{
|
|
"epoch": 5.713178294573644,
|
|
"grad_norm": 0.3996998930591703,
|
|
"learning_rate": 3.988543330880852e-06,
|
|
"loss": 0.1287,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12216873466968536,
|
|
"step": 3685,
|
|
"valid_targets_mean": 4865.8,
|
|
"valid_targets_min": 2765
|
|
},
|
|
{
|
|
"epoch": 5.720930232558139,
|
|
"grad_norm": 0.47040209067719235,
|
|
"learning_rate": 3.942329024282665e-06,
|
|
"loss": 0.1516,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16137559711933136,
|
|
"step": 3690,
|
|
"valid_targets_mean": 4531.0,
|
|
"valid_targets_min": 730
|
|
},
|
|
{
|
|
"epoch": 5.728682170542635,
|
|
"grad_norm": 0.3630897503273467,
|
|
"learning_rate": 3.896354727013811e-06,
|
|
"loss": 0.1532,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12590524554252625,
|
|
"step": 3695,
|
|
"valid_targets_mean": 5248.6,
|
|
"valid_targets_min": 2452
|
|
},
|
|
{
|
|
"epoch": 5.736434108527131,
|
|
"grad_norm": 0.4715032977447836,
|
|
"learning_rate": 3.850621126238716e-06,
|
|
"loss": 0.1437,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15132960677146912,
|
|
"step": 3700,
|
|
"valid_targets_mean": 3941.0,
|
|
"valid_targets_min": 325
|
|
},
|
|
{
|
|
"epoch": 5.7441860465116275,
|
|
"grad_norm": 0.4654118997053404,
|
|
"learning_rate": 3.8051289055241825e-06,
|
|
"loss": 0.162,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1751362681388855,
|
|
"step": 3705,
|
|
"valid_targets_mean": 4353.2,
|
|
"valid_targets_min": 2659
|
|
},
|
|
{
|
|
"epoch": 5.751937984496124,
|
|
"grad_norm": 0.5227568375922278,
|
|
"learning_rate": 3.759878744829182e-06,
|
|
"loss": 0.16,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18965643644332886,
|
|
"step": 3710,
|
|
"valid_targets_mean": 4459.4,
|
|
"valid_targets_min": 733
|
|
},
|
|
{
|
|
"epoch": 5.75968992248062,
|
|
"grad_norm": 0.4609905003497403,
|
|
"learning_rate": 3.7148713204946752e-06,
|
|
"loss": 0.147,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1515987515449524,
|
|
"step": 3715,
|
|
"valid_targets_mean": 4371.8,
|
|
"valid_targets_min": 621
|
|
},
|
|
{
|
|
"epoch": 5.767441860465116,
|
|
"grad_norm": 0.3918991200592125,
|
|
"learning_rate": 3.67010730523353e-06,
|
|
"loss": 0.1618,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12248925864696503,
|
|
"step": 3720,
|
|
"valid_targets_mean": 4360.6,
|
|
"valid_targets_min": 370
|
|
},
|
|
{
|
|
"epoch": 5.775193798449612,
|
|
"grad_norm": 0.467773056692704,
|
|
"learning_rate": 3.6255873681204332e-06,
|
|
"loss": 0.1566,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17771819233894348,
|
|
"step": 3725,
|
|
"valid_targets_mean": 4304.9,
|
|
"valid_targets_min": 288
|
|
},
|
|
{
|
|
"epoch": 5.782945736434108,
|
|
"grad_norm": 0.377912933539592,
|
|
"learning_rate": 3.5813121745819144e-06,
|
|
"loss": 0.1529,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14115823805332184,
|
|
"step": 3730,
|
|
"valid_targets_mean": 4955.0,
|
|
"valid_targets_min": 285
|
|
},
|
|
{
|
|
"epoch": 5.790697674418604,
|
|
"grad_norm": 0.3996511259289835,
|
|
"learning_rate": 3.537282386386387e-06,
|
|
"loss": 0.1561,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13390158116817474,
|
|
"step": 3735,
|
|
"valid_targets_mean": 4518.8,
|
|
"valid_targets_min": 339
|
|
},
|
|
{
|
|
"epoch": 5.7984496124031,
|
|
"grad_norm": 0.3701488362865712,
|
|
"learning_rate": 3.4934986616342737e-06,
|
|
"loss": 0.1768,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14555737376213074,
|
|
"step": 3740,
|
|
"valid_targets_mean": 5657.8,
|
|
"valid_targets_min": 2347
|
|
},
|
|
{
|
|
"epoch": 5.8062015503875966,
|
|
"grad_norm": 0.45199830351728787,
|
|
"learning_rate": 3.449961654748146e-06,
|
|
"loss": 0.1487,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.150042325258255,
|
|
"step": 3745,
|
|
"valid_targets_mean": 4127.3,
|
|
"valid_targets_min": 2290
|
|
},
|
|
{
|
|
"epoch": 5.813953488372093,
|
|
"grad_norm": 0.4369336909116495,
|
|
"learning_rate": 3.406672016462964e-06,
|
|
"loss": 0.1463,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13401828706264496,
|
|
"step": 3750,
|
|
"valid_targets_mean": 4274.8,
|
|
"valid_targets_min": 1856
|
|
},
|
|
{
|
|
"epoch": 5.821705426356589,
|
|
"grad_norm": 0.4834110812261461,
|
|
"learning_rate": 3.363630393816335e-06,
|
|
"loss": 0.1402,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15827834606170654,
|
|
"step": 3755,
|
|
"valid_targets_mean": 3873.9,
|
|
"valid_targets_min": 2432
|
|
},
|
|
{
|
|
"epoch": 5.829457364341085,
|
|
"grad_norm": 0.4597445261763014,
|
|
"learning_rate": 3.3208374301388504e-06,
|
|
"loss": 0.1627,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17994539439678192,
|
|
"step": 3760,
|
|
"valid_targets_mean": 4758.0,
|
|
"valid_targets_min": 1984
|
|
},
|
|
{
|
|
"epoch": 5.837209302325581,
|
|
"grad_norm": 0.42360510165536924,
|
|
"learning_rate": 3.278293765044469e-06,
|
|
"loss": 0.1546,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13492318987846375,
|
|
"step": 3765,
|
|
"valid_targets_mean": 4426.1,
|
|
"valid_targets_min": 233
|
|
},
|
|
{
|
|
"epoch": 5.844961240310077,
|
|
"grad_norm": 0.48922365457669503,
|
|
"learning_rate": 3.236000034420963e-06,
|
|
"loss": 0.1498,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14569556713104248,
|
|
"step": 3770,
|
|
"valid_targets_mean": 3687.8,
|
|
"valid_targets_min": 242
|
|
},
|
|
{
|
|
"epoch": 5.852713178294573,
|
|
"grad_norm": 0.4033773146053126,
|
|
"learning_rate": 3.193956870420396e-06,
|
|
"loss": 0.1738,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18744111061096191,
|
|
"step": 3775,
|
|
"valid_targets_mean": 5528.1,
|
|
"valid_targets_min": 611
|
|
},
|
|
{
|
|
"epoch": 5.8604651162790695,
|
|
"grad_norm": 0.34857475686830064,
|
|
"learning_rate": 3.1521649014496925e-06,
|
|
"loss": 0.155,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13359975814819336,
|
|
"step": 3780,
|
|
"valid_targets_mean": 5863.0,
|
|
"valid_targets_min": 2553
|
|
},
|
|
{
|
|
"epoch": 5.868217054263566,
|
|
"grad_norm": 0.4313376511492457,
|
|
"learning_rate": 3.110624752161229e-06,
|
|
"loss": 0.1689,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13781484961509705,
|
|
"step": 3785,
|
|
"valid_targets_mean": 5246.6,
|
|
"valid_targets_min": 578
|
|
},
|
|
{
|
|
"epoch": 5.875968992248062,
|
|
"grad_norm": 0.35972262523748805,
|
|
"learning_rate": 3.069337043443523e-06,
|
|
"loss": 0.1552,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1296289563179016,
|
|
"step": 3790,
|
|
"valid_targets_mean": 5488.9,
|
|
"valid_targets_min": 1966
|
|
},
|
|
{
|
|
"epoch": 5.883720930232558,
|
|
"grad_norm": 0.46395239595319404,
|
|
"learning_rate": 3.0283023924119236e-06,
|
|
"loss": 0.1425,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1438305675983429,
|
|
"step": 3795,
|
|
"valid_targets_mean": 5045.4,
|
|
"valid_targets_min": 548
|
|
},
|
|
{
|
|
"epoch": 5.891472868217054,
|
|
"grad_norm": 0.4216115298877531,
|
|
"learning_rate": 2.9875214123993967e-06,
|
|
"loss": 0.1489,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13032379746437073,
|
|
"step": 3800,
|
|
"valid_targets_mean": 5036.0,
|
|
"valid_targets_min": 513
|
|
},
|
|
{
|
|
"epoch": 5.89922480620155,
|
|
"grad_norm": 0.369645204601132,
|
|
"learning_rate": 2.94699471294738e-06,
|
|
"loss": 0.1474,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10359348356723785,
|
|
"step": 3805,
|
|
"valid_targets_mean": 4782.0,
|
|
"valid_targets_min": 395
|
|
},
|
|
{
|
|
"epoch": 5.906976744186046,
|
|
"grad_norm": 0.4329223252021753,
|
|
"learning_rate": 2.9067228997966347e-06,
|
|
"loss": 0.1488,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14920011162757874,
|
|
"step": 3810,
|
|
"valid_targets_mean": 4213.8,
|
|
"valid_targets_min": 265
|
|
},
|
|
{
|
|
"epoch": 5.9147286821705425,
|
|
"grad_norm": 0.38061473387366296,
|
|
"learning_rate": 2.8667065748782177e-06,
|
|
"loss": 0.1552,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11807483434677124,
|
|
"step": 3815,
|
|
"valid_targets_mean": 4682.1,
|
|
"valid_targets_min": 2866
|
|
},
|
|
{
|
|
"epoch": 5.922480620155039,
|
|
"grad_norm": 0.4630422264492311,
|
|
"learning_rate": 2.826946336304481e-06,
|
|
"loss": 0.1606,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1536155343055725,
|
|
"step": 3820,
|
|
"valid_targets_mean": 4259.2,
|
|
"valid_targets_min": 826
|
|
},
|
|
{
|
|
"epoch": 5.930232558139535,
|
|
"grad_norm": 0.4336604749432643,
|
|
"learning_rate": 2.7874427783601234e-06,
|
|
"loss": 0.1443,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13880223035812378,
|
|
"step": 3825,
|
|
"valid_targets_mean": 4519.3,
|
|
"valid_targets_min": 609
|
|
},
|
|
{
|
|
"epoch": 5.937984496124031,
|
|
"grad_norm": 0.5243528481538801,
|
|
"learning_rate": 2.7481964914933157e-06,
|
|
"loss": 0.1604,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17028310894966125,
|
|
"step": 3830,
|
|
"valid_targets_mean": 3623.1,
|
|
"valid_targets_min": 591
|
|
},
|
|
{
|
|
"epoch": 5.945736434108527,
|
|
"grad_norm": 0.4789980300582059,
|
|
"learning_rate": 2.7092080623068674e-06,
|
|
"loss": 0.1745,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1756812334060669,
|
|
"step": 3835,
|
|
"valid_targets_mean": 4744.0,
|
|
"valid_targets_min": 772
|
|
},
|
|
{
|
|
"epoch": 5.953488372093023,
|
|
"grad_norm": 0.45611253393283935,
|
|
"learning_rate": 2.6704780735494784e-06,
|
|
"loss": 0.1441,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1426219344139099,
|
|
"step": 3840,
|
|
"valid_targets_mean": 4248.6,
|
|
"valid_targets_min": 525
|
|
},
|
|
{
|
|
"epoch": 5.961240310077519,
|
|
"grad_norm": 0.3857782088985867,
|
|
"learning_rate": 2.6320071041070018e-06,
|
|
"loss": 0.1479,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11612827330827713,
|
|
"step": 3845,
|
|
"valid_targets_mean": 4773.6,
|
|
"valid_targets_min": 2511
|
|
},
|
|
{
|
|
"epoch": 5.9689922480620154,
|
|
"grad_norm": 0.4166115486481006,
|
|
"learning_rate": 2.593795728993804e-06,
|
|
"loss": 0.1544,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18450096249580383,
|
|
"step": 3850,
|
|
"valid_targets_mean": 5148.2,
|
|
"valid_targets_min": 2061
|
|
},
|
|
{
|
|
"epoch": 5.976744186046512,
|
|
"grad_norm": 0.4335144952819728,
|
|
"learning_rate": 2.555844519344186e-06,
|
|
"loss": 0.1444,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1622152328491211,
|
|
"step": 3855,
|
|
"valid_targets_mean": 5090.6,
|
|
"valid_targets_min": 790
|
|
},
|
|
{
|
|
"epoch": 5.984496124031008,
|
|
"grad_norm": 0.3565273610492274,
|
|
"learning_rate": 2.518154042403813e-06,
|
|
"loss": 0.1408,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12373974919319153,
|
|
"step": 3860,
|
|
"valid_targets_mean": 5277.1,
|
|
"valid_targets_min": 2691
|
|
},
|
|
{
|
|
"epoch": 5.992248062015504,
|
|
"grad_norm": 0.36972590062662825,
|
|
"learning_rate": 2.480724861521264e-06,
|
|
"loss": 0.1588,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10760015994310379,
|
|
"step": 3865,
|
|
"valid_targets_mean": 4705.8,
|
|
"valid_targets_min": 2256
|
|
},
|
|
{
|
|
"epoch": 6.0,
|
|
"grad_norm": 0.3774316986540542,
|
|
"learning_rate": 2.443557536139598e-06,
|
|
"loss": 0.1449,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13823938369750977,
|
|
"step": 3870,
|
|
"valid_targets_mean": 5121.6,
|
|
"valid_targets_min": 2951
|
|
},
|
|
{
|
|
"epoch": 6.007751937984496,
|
|
"grad_norm": 0.4491491812525188,
|
|
"learning_rate": 2.406652621787999e-06,
|
|
"loss": 0.1461,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1544957160949707,
|
|
"step": 3875,
|
|
"valid_targets_mean": 3907.7,
|
|
"valid_targets_min": 472
|
|
},
|
|
{
|
|
"epoch": 6.015503875968992,
|
|
"grad_norm": 0.39058530830234023,
|
|
"learning_rate": 2.3700106700734705e-06,
|
|
"loss": 0.1501,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11147475242614746,
|
|
"step": 3880,
|
|
"valid_targets_mean": 4658.1,
|
|
"valid_targets_min": 412
|
|
},
|
|
{
|
|
"epoch": 6.023255813953488,
|
|
"grad_norm": 0.4764404360508427,
|
|
"learning_rate": 2.3336322286725823e-06,
|
|
"loss": 0.1365,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1638670563697815,
|
|
"step": 3885,
|
|
"valid_targets_mean": 3920.1,
|
|
"valid_targets_min": 792
|
|
},
|
|
{
|
|
"epoch": 6.0310077519379846,
|
|
"grad_norm": 0.41031515357008064,
|
|
"learning_rate": 2.2975178413233047e-06,
|
|
"loss": 0.1426,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11806363612413406,
|
|
"step": 3890,
|
|
"valid_targets_mean": 4190.1,
|
|
"valid_targets_min": 2164
|
|
},
|
|
{
|
|
"epoch": 6.038759689922481,
|
|
"grad_norm": 0.4080067588790369,
|
|
"learning_rate": 2.261668047816863e-06,
|
|
"loss": 0.1442,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16606493294239044,
|
|
"step": 3895,
|
|
"valid_targets_mean": 5487.4,
|
|
"valid_targets_min": 272
|
|
},
|
|
{
|
|
"epoch": 6.046511627906977,
|
|
"grad_norm": 0.4182771476362144,
|
|
"learning_rate": 2.226083383989668e-06,
|
|
"loss": 0.1454,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12919700145721436,
|
|
"step": 3900,
|
|
"valid_targets_mean": 4410.3,
|
|
"valid_targets_min": 453
|
|
},
|
|
{
|
|
"epoch": 6.054263565891473,
|
|
"grad_norm": 0.465578156889018,
|
|
"learning_rate": 2.1907643817153313e-06,
|
|
"loss": 0.1429,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1524408608675003,
|
|
"step": 3905,
|
|
"valid_targets_mean": 4006.7,
|
|
"valid_targets_min": 402
|
|
},
|
|
{
|
|
"epoch": 6.062015503875969,
|
|
"grad_norm": 0.49003831755013766,
|
|
"learning_rate": 2.1557115688966835e-06,
|
|
"loss": 0.1466,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15983235836029053,
|
|
"step": 3910,
|
|
"valid_targets_mean": 3748.0,
|
|
"valid_targets_min": 1984
|
|
},
|
|
{
|
|
"epoch": 6.069767441860465,
|
|
"grad_norm": 0.4793985294195704,
|
|
"learning_rate": 2.120925469457904e-06,
|
|
"loss": 0.1492,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1331721544265747,
|
|
"step": 3915,
|
|
"valid_targets_mean": 3765.6,
|
|
"valid_targets_min": 1989
|
|
},
|
|
{
|
|
"epoch": 6.077519379844961,
|
|
"grad_norm": 0.4857730761757885,
|
|
"learning_rate": 2.086406603336686e-06,
|
|
"loss": 0.162,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.223957359790802,
|
|
"step": 3920,
|
|
"valid_targets_mean": 4345.2,
|
|
"valid_targets_min": 487
|
|
},
|
|
{
|
|
"epoch": 6.0852713178294575,
|
|
"grad_norm": 0.38478031129260776,
|
|
"learning_rate": 2.052155486476466e-06,
|
|
"loss": 0.1401,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.141106978058815,
|
|
"step": 3925,
|
|
"valid_targets_mean": 5665.4,
|
|
"valid_targets_min": 1766
|
|
},
|
|
{
|
|
"epoch": 6.093023255813954,
|
|
"grad_norm": 0.572101341083877,
|
|
"learning_rate": 2.0181726308187044e-06,
|
|
"loss": 0.1537,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16148856282234192,
|
|
"step": 3930,
|
|
"valid_targets_mean": 3327.9,
|
|
"valid_targets_min": 393
|
|
},
|
|
{
|
|
"epoch": 6.10077519379845,
|
|
"grad_norm": 0.5702565613060158,
|
|
"learning_rate": 1.984458544295247e-06,
|
|
"loss": 0.1491,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15981945395469666,
|
|
"step": 3935,
|
|
"valid_targets_mean": 3374.9,
|
|
"valid_targets_min": 665
|
|
},
|
|
{
|
|
"epoch": 6.108527131782946,
|
|
"grad_norm": 0.41153314259954854,
|
|
"learning_rate": 1.9510137308207187e-06,
|
|
"loss": 0.144,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14380812644958496,
|
|
"step": 3940,
|
|
"valid_targets_mean": 4357.6,
|
|
"valid_targets_min": 343
|
|
},
|
|
{
|
|
"epoch": 6.116279069767442,
|
|
"grad_norm": 0.42473098729111763,
|
|
"learning_rate": 1.9178386902850033e-06,
|
|
"loss": 0.1416,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12821288406848907,
|
|
"step": 3945,
|
|
"valid_targets_mean": 3923.3,
|
|
"valid_targets_min": 266
|
|
},
|
|
{
|
|
"epoch": 6.124031007751938,
|
|
"grad_norm": 0.4233818856902045,
|
|
"learning_rate": 1.884933918545766e-06,
|
|
"loss": 0.1382,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14326541125774384,
|
|
"step": 3950,
|
|
"valid_targets_mean": 4490.9,
|
|
"valid_targets_min": 513
|
|
},
|
|
{
|
|
"epoch": 6.131782945736434,
|
|
"grad_norm": 0.4075534532593769,
|
|
"learning_rate": 1.8522999074210357e-06,
|
|
"loss": 0.1425,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13676217198371887,
|
|
"step": 3955,
|
|
"valid_targets_mean": 5278.7,
|
|
"valid_targets_min": 773
|
|
},
|
|
{
|
|
"epoch": 6.1395348837209305,
|
|
"grad_norm": 0.4831447381224601,
|
|
"learning_rate": 1.819937144681876e-06,
|
|
"loss": 0.1481,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14638128876686096,
|
|
"step": 3960,
|
|
"valid_targets_mean": 4841.4,
|
|
"valid_targets_min": 1843
|
|
},
|
|
{
|
|
"epoch": 6.147286821705427,
|
|
"grad_norm": 0.5692373377592979,
|
|
"learning_rate": 1.7878461140450709e-06,
|
|
"loss": 0.146,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17473667860031128,
|
|
"step": 3965,
|
|
"valid_targets_mean": 3916.5,
|
|
"valid_targets_min": 1954
|
|
},
|
|
{
|
|
"epoch": 6.155038759689923,
|
|
"grad_norm": 0.4411787512540076,
|
|
"learning_rate": 1.7560272951659007e-06,
|
|
"loss": 0.1499,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16196417808532715,
|
|
"step": 3970,
|
|
"valid_targets_mean": 4841.2,
|
|
"valid_targets_min": 681
|
|
},
|
|
{
|
|
"epoch": 6.162790697674419,
|
|
"grad_norm": 0.4144797822314153,
|
|
"learning_rate": 1.7244811636309865e-06,
|
|
"loss": 0.1459,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12838700413703918,
|
|
"step": 3975,
|
|
"valid_targets_mean": 5786.5,
|
|
"valid_targets_min": 536
|
|
},
|
|
{
|
|
"epoch": 6.170542635658915,
|
|
"grad_norm": 0.4579031301080518,
|
|
"learning_rate": 1.693208190951159e-06,
|
|
"loss": 0.148,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1469820737838745,
|
|
"step": 3980,
|
|
"valid_targets_mean": 4262.1,
|
|
"valid_targets_min": 2558
|
|
},
|
|
{
|
|
"epoch": 6.178294573643411,
|
|
"grad_norm": 0.35185050016875424,
|
|
"learning_rate": 1.6622088445544337e-06,
|
|
"loss": 0.1488,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.129560187458992,
|
|
"step": 3985,
|
|
"valid_targets_mean": 5511.1,
|
|
"valid_targets_min": 710
|
|
},
|
|
{
|
|
"epoch": 6.186046511627907,
|
|
"grad_norm": 0.41851723149449205,
|
|
"learning_rate": 1.6314835877790035e-06,
|
|
"loss": 0.141,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15272796154022217,
|
|
"step": 3990,
|
|
"valid_targets_mean": 4655.8,
|
|
"valid_targets_min": 332
|
|
},
|
|
{
|
|
"epoch": 6.1937984496124034,
|
|
"grad_norm": 0.40076139878422207,
|
|
"learning_rate": 1.6010328798663332e-06,
|
|
"loss": 0.1481,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12933820486068726,
|
|
"step": 3995,
|
|
"valid_targets_mean": 5362.1,
|
|
"valid_targets_min": 3053
|
|
},
|
|
{
|
|
"epoch": 6.2015503875969,
|
|
"grad_norm": 0.45341665170317824,
|
|
"learning_rate": 1.570857175954279e-06,
|
|
"loss": 0.1637,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12798666954040527,
|
|
"step": 4000,
|
|
"valid_targets_mean": 4509.7,
|
|
"valid_targets_min": 489
|
|
},
|
|
{
|
|
"epoch": 6.209302325581396,
|
|
"grad_norm": 0.3607620367511857,
|
|
"learning_rate": 1.540956927070294e-06,
|
|
"loss": 0.128,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11347877979278564,
|
|
"step": 4005,
|
|
"valid_targets_mean": 5619.4,
|
|
"valid_targets_min": 2424
|
|
},
|
|
{
|
|
"epoch": 6.217054263565892,
|
|
"grad_norm": 0.5026070546003747,
|
|
"learning_rate": 1.5113325801246914e-06,
|
|
"loss": 0.1531,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18720689415931702,
|
|
"step": 4010,
|
|
"valid_targets_mean": 4427.4,
|
|
"valid_targets_min": 1430
|
|
},
|
|
{
|
|
"epoch": 6.224806201550388,
|
|
"grad_norm": 0.43575139062965373,
|
|
"learning_rate": 1.4819845779039477e-06,
|
|
"loss": 0.1657,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1679738312959671,
|
|
"step": 4015,
|
|
"valid_targets_mean": 5928.5,
|
|
"valid_targets_min": 808
|
|
},
|
|
{
|
|
"epoch": 6.232558139534884,
|
|
"grad_norm": 0.42143605193627004,
|
|
"learning_rate": 1.4529133590641009e-06,
|
|
"loss": 0.1343,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13898807764053345,
|
|
"step": 4020,
|
|
"valid_targets_mean": 4824.2,
|
|
"valid_targets_min": 1828
|
|
},
|
|
{
|
|
"epoch": 6.24031007751938,
|
|
"grad_norm": 0.4220444192180161,
|
|
"learning_rate": 1.4241193581241964e-06,
|
|
"loss": 0.1369,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12464825809001923,
|
|
"step": 4025,
|
|
"valid_targets_mean": 4312.4,
|
|
"valid_targets_min": 280
|
|
},
|
|
{
|
|
"epoch": 6.248062015503876,
|
|
"grad_norm": 0.4246528594263321,
|
|
"learning_rate": 1.395603005459769e-06,
|
|
"loss": 0.1514,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11180758476257324,
|
|
"step": 4030,
|
|
"valid_targets_mean": 5064.3,
|
|
"valid_targets_min": 268
|
|
},
|
|
{
|
|
"epoch": 6.2558139534883725,
|
|
"grad_norm": 0.4601989305033969,
|
|
"learning_rate": 1.367364727296434e-06,
|
|
"loss": 0.1391,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17486141622066498,
|
|
"step": 4035,
|
|
"valid_targets_mean": 4553.9,
|
|
"valid_targets_min": 455
|
|
},
|
|
{
|
|
"epoch": 6.263565891472869,
|
|
"grad_norm": 0.41743085880863806,
|
|
"learning_rate": 1.3394049457035063e-06,
|
|
"loss": 0.1271,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11269478499889374,
|
|
"step": 4040,
|
|
"valid_targets_mean": 4022.4,
|
|
"valid_targets_min": 396
|
|
},
|
|
{
|
|
"epoch": 6.271317829457364,
|
|
"grad_norm": 0.3957905593683059,
|
|
"learning_rate": 1.3117240785876994e-06,
|
|
"loss": 0.1397,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1279354691505432,
|
|
"step": 4045,
|
|
"valid_targets_mean": 4760.3,
|
|
"valid_targets_min": 573
|
|
},
|
|
{
|
|
"epoch": 6.27906976744186,
|
|
"grad_norm": 0.46939606376712706,
|
|
"learning_rate": 1.2843225396868707e-06,
|
|
"loss": 0.1278,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14345014095306396,
|
|
"step": 4050,
|
|
"valid_targets_mean": 3840.0,
|
|
"valid_targets_min": 977
|
|
},
|
|
{
|
|
"epoch": 6.286821705426356,
|
|
"grad_norm": 0.45118172267262807,
|
|
"learning_rate": 1.2572007385638264e-06,
|
|
"loss": 0.1409,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13466718792915344,
|
|
"step": 4055,
|
|
"valid_targets_mean": 5589.4,
|
|
"valid_targets_min": 2910
|
|
},
|
|
{
|
|
"epoch": 6.294573643410852,
|
|
"grad_norm": 0.47093501864092696,
|
|
"learning_rate": 1.2303590806002341e-06,
|
|
"loss": 0.138,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17266318202018738,
|
|
"step": 4060,
|
|
"valid_targets_mean": 4088.8,
|
|
"valid_targets_min": 1934
|
|
},
|
|
{
|
|
"epoch": 6.3023255813953485,
|
|
"grad_norm": 0.43593257987581496,
|
|
"learning_rate": 1.2037979669905341e-06,
|
|
"loss": 0.1462,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1565391570329666,
|
|
"step": 4065,
|
|
"valid_targets_mean": 5561.3,
|
|
"valid_targets_min": 2171
|
|
},
|
|
{
|
|
"epoch": 6.310077519379845,
|
|
"grad_norm": 0.38442258109857474,
|
|
"learning_rate": 1.1775177947359472e-06,
|
|
"loss": 0.1469,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.120355024933815,
|
|
"step": 4070,
|
|
"valid_targets_mean": 5508.9,
|
|
"valid_targets_min": 600
|
|
},
|
|
{
|
|
"epoch": 6.317829457364341,
|
|
"grad_norm": 0.5116245670615639,
|
|
"learning_rate": 1.1515189566385598e-06,
|
|
"loss": 0.1536,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15075933933258057,
|
|
"step": 4075,
|
|
"valid_targets_mean": 3669.8,
|
|
"valid_targets_min": 289
|
|
},
|
|
{
|
|
"epoch": 6.325581395348837,
|
|
"grad_norm": 0.519726609280829,
|
|
"learning_rate": 1.125801841295422e-06,
|
|
"loss": 0.1538,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1663362681865692,
|
|
"step": 4080,
|
|
"valid_targets_mean": 3507.8,
|
|
"valid_targets_min": 755
|
|
},
|
|
{
|
|
"epoch": 6.333333333333333,
|
|
"grad_norm": 0.5066281048339958,
|
|
"learning_rate": 1.1003668330927674e-06,
|
|
"loss": 0.1561,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17226609587669373,
|
|
"step": 4085,
|
|
"valid_targets_mean": 3913.7,
|
|
"valid_targets_min": 891
|
|
},
|
|
{
|
|
"epoch": 6.341085271317829,
|
|
"grad_norm": 0.4168253714412732,
|
|
"learning_rate": 1.0752143122002502e-06,
|
|
"loss": 0.1549,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13902395963668823,
|
|
"step": 4090,
|
|
"valid_targets_mean": 4731.2,
|
|
"valid_targets_min": 310
|
|
},
|
|
{
|
|
"epoch": 6.348837209302325,
|
|
"grad_norm": 0.3943285404063543,
|
|
"learning_rate": 1.0503446545652718e-06,
|
|
"loss": 0.1437,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13005225360393524,
|
|
"step": 4095,
|
|
"valid_targets_mean": 4982.7,
|
|
"valid_targets_min": 575
|
|
},
|
|
{
|
|
"epoch": 6.3565891472868215,
|
|
"grad_norm": 0.4120867129337237,
|
|
"learning_rate": 1.0257582319073612e-06,
|
|
"loss": 0.1276,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11511364579200745,
|
|
"step": 4100,
|
|
"valid_targets_mean": 4254.6,
|
|
"valid_targets_min": 869
|
|
},
|
|
{
|
|
"epoch": 6.364341085271318,
|
|
"grad_norm": 0.44941410097724094,
|
|
"learning_rate": 1.001455411712613e-06,
|
|
"loss": 0.1475,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14647594094276428,
|
|
"step": 4105,
|
|
"valid_targets_mean": 4231.6,
|
|
"valid_targets_min": 709
|
|
},
|
|
{
|
|
"epoch": 6.372093023255814,
|
|
"grad_norm": 0.38228475170706705,
|
|
"learning_rate": 9.774365572281973e-07,
|
|
"loss": 0.1393,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12529915571212769,
|
|
"step": 4110,
|
|
"valid_targets_mean": 5377.4,
|
|
"valid_targets_min": 2890
|
|
},
|
|
{
|
|
"epoch": 6.37984496124031,
|
|
"grad_norm": 0.40870796264529896,
|
|
"learning_rate": 9.537020274569376e-07,
|
|
"loss": 0.1378,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1220163106918335,
|
|
"step": 4115,
|
|
"valid_targets_mean": 4960.4,
|
|
"valid_targets_min": 617
|
|
},
|
|
{
|
|
"epoch": 6.387596899224806,
|
|
"grad_norm": 0.4785371009759146,
|
|
"learning_rate": 9.302521771519291e-07,
|
|
"loss": 0.1724,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15229693055152893,
|
|
"step": 4120,
|
|
"valid_targets_mean": 4179.5,
|
|
"valid_targets_min": 794
|
|
},
|
|
{
|
|
"epoch": 6.395348837209302,
|
|
"grad_norm": 0.5482438722247103,
|
|
"learning_rate": 9.070873568112537e-07,
|
|
"loss": 0.1715,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20323488116264343,
|
|
"step": 4125,
|
|
"valid_targets_mean": 3866.2,
|
|
"valid_targets_min": 528
|
|
},
|
|
{
|
|
"epoch": 6.403100775193798,
|
|
"grad_norm": 0.34393102511247997,
|
|
"learning_rate": 8.842079126727365e-07,
|
|
"loss": 0.1438,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17043393850326538,
|
|
"step": 4130,
|
|
"valid_targets_mean": 8063.3,
|
|
"valid_targets_min": 1395
|
|
},
|
|
{
|
|
"epoch": 6.410852713178294,
|
|
"grad_norm": 0.48778735386271366,
|
|
"learning_rate": 8.616141867087569e-07,
|
|
"loss": 0.1415,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1254102885723114,
|
|
"step": 4135,
|
|
"valid_targets_mean": 4153.1,
|
|
"valid_targets_min": 497
|
|
},
|
|
{
|
|
"epoch": 6.4186046511627906,
|
|
"grad_norm": 0.42788835357838334,
|
|
"learning_rate": 8.393065166211544e-07,
|
|
"loss": 0.1385,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1304156631231308,
|
|
"step": 4140,
|
|
"valid_targets_mean": 4457.7,
|
|
"valid_targets_min": 1134
|
|
},
|
|
{
|
|
"epoch": 6.426356589147287,
|
|
"grad_norm": 0.39619956994694927,
|
|
"learning_rate": 8.172852358361782e-07,
|
|
"loss": 0.1455,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1729072630405426,
|
|
"step": 4145,
|
|
"valid_targets_mean": 5565.4,
|
|
"valid_targets_min": 629
|
|
},
|
|
{
|
|
"epoch": 6.434108527131783,
|
|
"grad_norm": 0.4776261582174204,
|
|
"learning_rate": 7.955506734994922e-07,
|
|
"loss": 0.139,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17891857028007507,
|
|
"step": 4150,
|
|
"valid_targets_mean": 4085.9,
|
|
"valid_targets_min": 482
|
|
},
|
|
{
|
|
"epoch": 6.441860465116279,
|
|
"grad_norm": 0.4278671968152442,
|
|
"learning_rate": 7.741031544712663e-07,
|
|
"loss": 0.1358,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12771019339561462,
|
|
"step": 4155,
|
|
"valid_targets_mean": 4428.9,
|
|
"valid_targets_min": 479
|
|
},
|
|
{
|
|
"epoch": 6.449612403100775,
|
|
"grad_norm": 0.37776538158237155,
|
|
"learning_rate": 7.529429993213222e-07,
|
|
"loss": 0.1423,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12023401260375977,
|
|
"step": 4160,
|
|
"valid_targets_mean": 5098.1,
|
|
"valid_targets_min": 994
|
|
},
|
|
{
|
|
"epoch": 6.457364341085271,
|
|
"grad_norm": 0.43694272212869895,
|
|
"learning_rate": 7.320705243243287e-07,
|
|
"loss": 0.1405,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14688435196876526,
|
|
"step": 4165,
|
|
"valid_targets_mean": 5080.8,
|
|
"valid_targets_min": 675
|
|
},
|
|
{
|
|
"epoch": 6.465116279069767,
|
|
"grad_norm": 0.4225966998298987,
|
|
"learning_rate": 7.114860414550917e-07,
|
|
"loss": 0.1385,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14561529457569122,
|
|
"step": 4170,
|
|
"valid_targets_mean": 5137.9,
|
|
"valid_targets_min": 2089
|
|
},
|
|
{
|
|
"epoch": 6.4728682170542635,
|
|
"grad_norm": 0.4688876624797445,
|
|
"learning_rate": 6.911898583838738e-07,
|
|
"loss": 0.151,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15033042430877686,
|
|
"step": 4175,
|
|
"valid_targets_mean": 4029.8,
|
|
"valid_targets_min": 661
|
|
},
|
|
{
|
|
"epoch": 6.48062015503876,
|
|
"grad_norm": 0.4340667422133109,
|
|
"learning_rate": 6.711822784718158e-07,
|
|
"loss": 0.1515,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15977023541927338,
|
|
"step": 4180,
|
|
"valid_targets_mean": 4863.2,
|
|
"valid_targets_min": 2046
|
|
},
|
|
{
|
|
"epoch": 6.488372093023256,
|
|
"grad_norm": 0.4569382782087973,
|
|
"learning_rate": 6.5146360076638e-07,
|
|
"loss": 0.1623,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1681194007396698,
|
|
"step": 4185,
|
|
"valid_targets_mean": 4351.9,
|
|
"valid_targets_min": 315
|
|
},
|
|
{
|
|
"epoch": 6.496124031007752,
|
|
"grad_norm": 0.4554589036178452,
|
|
"learning_rate": 6.320341199968982e-07,
|
|
"loss": 0.1476,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15873485803604126,
|
|
"step": 4190,
|
|
"valid_targets_mean": 4564.2,
|
|
"valid_targets_min": 658
|
|
},
|
|
{
|
|
"epoch": 6.503875968992248,
|
|
"grad_norm": 0.49218409403445584,
|
|
"learning_rate": 6.128941265701627e-07,
|
|
"loss": 0.1387,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1481098085641861,
|
|
"step": 4195,
|
|
"valid_targets_mean": 3601.8,
|
|
"valid_targets_min": 352
|
|
},
|
|
{
|
|
"epoch": 6.511627906976744,
|
|
"grad_norm": 0.4096283466727092,
|
|
"learning_rate": 5.94043906566073e-07,
|
|
"loss": 0.1333,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13861069083213806,
|
|
"step": 4200,
|
|
"valid_targets_mean": 4857.5,
|
|
"valid_targets_min": 326
|
|
},
|
|
{
|
|
"epoch": 6.51937984496124,
|
|
"grad_norm": 0.46885200416042144,
|
|
"learning_rate": 5.754837417333781e-07,
|
|
"loss": 0.1389,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14652873575687408,
|
|
"step": 4205,
|
|
"valid_targets_mean": 3894.9,
|
|
"valid_targets_min": 906
|
|
},
|
|
{
|
|
"epoch": 6.5271317829457365,
|
|
"grad_norm": 0.3885968728101716,
|
|
"learning_rate": 5.572139094854478e-07,
|
|
"loss": 0.1482,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12030985951423645,
|
|
"step": 4210,
|
|
"valid_targets_mean": 4954.5,
|
|
"valid_targets_min": 2183
|
|
},
|
|
{
|
|
"epoch": 6.534883720930233,
|
|
"grad_norm": 0.37139089742268966,
|
|
"learning_rate": 5.392346828961504e-07,
|
|
"loss": 0.1401,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11080891638994217,
|
|
"step": 4215,
|
|
"valid_targets_mean": 5050.3,
|
|
"valid_targets_min": 298
|
|
},
|
|
{
|
|
"epoch": 6.542635658914729,
|
|
"grad_norm": 0.3853585068404549,
|
|
"learning_rate": 5.215463306957436e-07,
|
|
"loss": 0.1479,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13822655379772186,
|
|
"step": 4220,
|
|
"valid_targets_mean": 5455.0,
|
|
"valid_targets_min": 2416
|
|
},
|
|
{
|
|
"epoch": 6.550387596899225,
|
|
"grad_norm": 0.4726856345826331,
|
|
"learning_rate": 5.0414911726687e-07,
|
|
"loss": 0.1675,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22890380024909973,
|
|
"step": 4225,
|
|
"valid_targets_mean": 5294.4,
|
|
"valid_targets_min": 781
|
|
},
|
|
{
|
|
"epoch": 6.558139534883721,
|
|
"grad_norm": 0.4031349839399349,
|
|
"learning_rate": 4.870433026406152e-07,
|
|
"loss": 0.1508,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13684213161468506,
|
|
"step": 4230,
|
|
"valid_targets_mean": 4680.8,
|
|
"valid_targets_min": 2718
|
|
},
|
|
{
|
|
"epoch": 6.565891472868217,
|
|
"grad_norm": 0.48960339790783236,
|
|
"learning_rate": 4.7022914249260197e-07,
|
|
"loss": 0.1597,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1440485715866089,
|
|
"step": 4235,
|
|
"valid_targets_mean": 4090.7,
|
|
"valid_targets_min": 2062
|
|
},
|
|
{
|
|
"epoch": 6.573643410852713,
|
|
"grad_norm": 0.48029936611780594,
|
|
"learning_rate": 4.537068881391848e-07,
|
|
"loss": 0.138,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15450087189674377,
|
|
"step": 4240,
|
|
"valid_targets_mean": 3792.6,
|
|
"valid_targets_min": 2354
|
|
},
|
|
{
|
|
"epoch": 6.5813953488372094,
|
|
"grad_norm": 0.411026213138413,
|
|
"learning_rate": 4.37476786533686e-07,
|
|
"loss": 0.1413,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11528407782316208,
|
|
"step": 4245,
|
|
"valid_targets_mean": 5034.7,
|
|
"valid_targets_min": 682
|
|
},
|
|
{
|
|
"epoch": 6.589147286821706,
|
|
"grad_norm": 0.3613114304130289,
|
|
"learning_rate": 4.2153908026270504e-07,
|
|
"loss": 0.1404,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11450152099132538,
|
|
"step": 4250,
|
|
"valid_targets_mean": 5106.2,
|
|
"valid_targets_min": 3567
|
|
},
|
|
{
|
|
"epoch": 6.596899224806202,
|
|
"grad_norm": 0.49968357376260497,
|
|
"learning_rate": 4.058940075424933e-07,
|
|
"loss": 0.1505,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1560279130935669,
|
|
"step": 4255,
|
|
"valid_targets_mean": 4061.5,
|
|
"valid_targets_min": 2069
|
|
},
|
|
{
|
|
"epoch": 6.604651162790698,
|
|
"grad_norm": 0.46911068601775274,
|
|
"learning_rate": 3.9054180221539394e-07,
|
|
"loss": 0.1538,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13993695378303528,
|
|
"step": 4260,
|
|
"valid_targets_mean": 3780.2,
|
|
"valid_targets_min": 790
|
|
},
|
|
{
|
|
"epoch": 6.612403100775194,
|
|
"grad_norm": 0.3917124798281757,
|
|
"learning_rate": 3.7548269374634736e-07,
|
|
"loss": 0.1344,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11809076368808746,
|
|
"step": 4265,
|
|
"valid_targets_mean": 4906.1,
|
|
"valid_targets_min": 253
|
|
},
|
|
{
|
|
"epoch": 6.62015503875969,
|
|
"grad_norm": 0.43882837837397076,
|
|
"learning_rate": 3.607169072194583e-07,
|
|
"loss": 0.1303,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13036519289016724,
|
|
"step": 4270,
|
|
"valid_targets_mean": 4900.6,
|
|
"valid_targets_min": 449
|
|
},
|
|
{
|
|
"epoch": 6.627906976744186,
|
|
"grad_norm": 0.3783203483240392,
|
|
"learning_rate": 3.4624466333464057e-07,
|
|
"loss": 0.1386,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13775168359279633,
|
|
"step": 4275,
|
|
"valid_targets_mean": 5567.1,
|
|
"valid_targets_min": 523
|
|
},
|
|
{
|
|
"epoch": 6.635658914728682,
|
|
"grad_norm": 0.3505902467720475,
|
|
"learning_rate": 3.320661784043e-07,
|
|
"loss": 0.1366,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11130744218826294,
|
|
"step": 4280,
|
|
"valid_targets_mean": 6773.1,
|
|
"valid_targets_min": 3288
|
|
},
|
|
{
|
|
"epoch": 6.6434108527131785,
|
|
"grad_norm": 0.4364368560735114,
|
|
"learning_rate": 3.1818166435012563e-07,
|
|
"loss": 0.1503,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15424305200576782,
|
|
"step": 4285,
|
|
"valid_targets_mean": 4766.6,
|
|
"valid_targets_min": 605
|
|
},
|
|
{
|
|
"epoch": 6.651162790697675,
|
|
"grad_norm": 0.49428323333345386,
|
|
"learning_rate": 3.0459132869989914e-07,
|
|
"loss": 0.1635,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17941808700561523,
|
|
"step": 4290,
|
|
"valid_targets_mean": 4228.8,
|
|
"valid_targets_min": 575
|
|
},
|
|
{
|
|
"epoch": 6.658914728682171,
|
|
"grad_norm": 0.4532498891303768,
|
|
"learning_rate": 2.912953745844083e-07,
|
|
"loss": 0.1603,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16425731778144836,
|
|
"step": 4295,
|
|
"valid_targets_mean": 4930.4,
|
|
"valid_targets_min": 512
|
|
},
|
|
{
|
|
"epoch": 6.666666666666667,
|
|
"grad_norm": 0.4484218818013772,
|
|
"learning_rate": 2.7829400073440704e-07,
|
|
"loss": 0.147,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14921866357326508,
|
|
"step": 4300,
|
|
"valid_targets_mean": 4864.6,
|
|
"valid_targets_min": 2160
|
|
},
|
|
{
|
|
"epoch": 6.674418604651163,
|
|
"grad_norm": 0.5128051450701466,
|
|
"learning_rate": 2.655874014776427e-07,
|
|
"loss": 0.1484,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19552041590213776,
|
|
"step": 4305,
|
|
"valid_targets_mean": 4560.8,
|
|
"valid_targets_min": 324
|
|
},
|
|
{
|
|
"epoch": 6.682170542635659,
|
|
"grad_norm": 0.39420076435511847,
|
|
"learning_rate": 2.531757667359491e-07,
|
|
"loss": 0.1343,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11401358246803284,
|
|
"step": 4310,
|
|
"valid_targets_mean": 5222.8,
|
|
"valid_targets_min": 2452
|
|
},
|
|
{
|
|
"epoch": 6.689922480620155,
|
|
"grad_norm": 0.39424587927802124,
|
|
"learning_rate": 2.4105928202241557e-07,
|
|
"loss": 0.1313,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10992264747619629,
|
|
"step": 4315,
|
|
"valid_targets_mean": 4744.0,
|
|
"valid_targets_min": 946
|
|
},
|
|
{
|
|
"epoch": 6.6976744186046515,
|
|
"grad_norm": 0.4909208750282455,
|
|
"learning_rate": 2.2923812843861136e-07,
|
|
"loss": 0.1569,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1754213571548462,
|
|
"step": 4320,
|
|
"valid_targets_mean": 4488.9,
|
|
"valid_targets_min": 267
|
|
},
|
|
{
|
|
"epoch": 6.705426356589148,
|
|
"grad_norm": 0.46076430916005,
|
|
"learning_rate": 2.1771248267186795e-07,
|
|
"loss": 0.1439,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15366077423095703,
|
|
"step": 4325,
|
|
"valid_targets_mean": 3990.3,
|
|
"valid_targets_min": 412
|
|
},
|
|
{
|
|
"epoch": 6.713178294573644,
|
|
"grad_norm": 0.44837990403963107,
|
|
"learning_rate": 2.064825169926632e-07,
|
|
"loss": 0.1436,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14431065320968628,
|
|
"step": 4330,
|
|
"valid_targets_mean": 4223.2,
|
|
"valid_targets_min": 1821
|
|
},
|
|
{
|
|
"epoch": 6.720930232558139,
|
|
"grad_norm": 0.3689938810371774,
|
|
"learning_rate": 1.9554839925201686e-07,
|
|
"loss": 0.1333,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16173899173736572,
|
|
"step": 4335,
|
|
"valid_targets_mean": 6193.9,
|
|
"valid_targets_min": 3050
|
|
},
|
|
{
|
|
"epoch": 6.728682170542635,
|
|
"grad_norm": 0.3834490175252527,
|
|
"learning_rate": 1.849102928790014e-07,
|
|
"loss": 0.1465,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15902329981327057,
|
|
"step": 4340,
|
|
"valid_targets_mean": 5950.6,
|
|
"valid_targets_min": 532
|
|
},
|
|
{
|
|
"epoch": 6.736434108527131,
|
|
"grad_norm": 0.3806645179110598,
|
|
"learning_rate": 1.74568356878293e-07,
|
|
"loss": 0.1431,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15495096147060394,
|
|
"step": 4345,
|
|
"valid_targets_mean": 5389.5,
|
|
"valid_targets_min": 2093
|
|
},
|
|
{
|
|
"epoch": 6.7441860465116275,
|
|
"grad_norm": 0.5001568087478473,
|
|
"learning_rate": 1.6452274582779537e-07,
|
|
"loss": 0.1494,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14459748566150665,
|
|
"step": 4350,
|
|
"valid_targets_mean": 4592.8,
|
|
"valid_targets_min": 555
|
|
},
|
|
{
|
|
"epoch": 6.751937984496124,
|
|
"grad_norm": 0.5854439307900624,
|
|
"learning_rate": 1.5477360987633305e-07,
|
|
"loss": 0.166,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19409656524658203,
|
|
"step": 4355,
|
|
"valid_targets_mean": 3547.4,
|
|
"valid_targets_min": 529
|
|
},
|
|
{
|
|
"epoch": 6.75968992248062,
|
|
"grad_norm": 0.4665900083114806,
|
|
"learning_rate": 1.453210947413952e-07,
|
|
"loss": 0.1467,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1850074976682663,
|
|
"step": 4360,
|
|
"valid_targets_mean": 4564.8,
|
|
"valid_targets_min": 540
|
|
},
|
|
{
|
|
"epoch": 6.767441860465116,
|
|
"grad_norm": 0.48350023695445227,
|
|
"learning_rate": 1.3616534170697747e-07,
|
|
"loss": 0.1539,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15944364666938782,
|
|
"step": 4365,
|
|
"valid_targets_mean": 3584.8,
|
|
"valid_targets_min": 263
|
|
},
|
|
{
|
|
"epoch": 6.775193798449612,
|
|
"grad_norm": 0.45038375032977,
|
|
"learning_rate": 1.2730648762144804e-07,
|
|
"loss": 0.1552,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18844370543956757,
|
|
"step": 4370,
|
|
"valid_targets_mean": 5290.8,
|
|
"valid_targets_min": 806
|
|
},
|
|
{
|
|
"epoch": 6.782945736434108,
|
|
"grad_norm": 0.4134945839078117,
|
|
"learning_rate": 1.1874466489551817e-07,
|
|
"loss": 0.1408,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15977919101715088,
|
|
"step": 4375,
|
|
"valid_targets_mean": 4978.0,
|
|
"valid_targets_min": 325
|
|
},
|
|
{
|
|
"epoch": 6.790697674418604,
|
|
"grad_norm": 0.40450500367697456,
|
|
"learning_rate": 1.1048000150025939e-07,
|
|
"loss": 0.1453,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13722053170204163,
|
|
"step": 4380,
|
|
"valid_targets_mean": 4658.6,
|
|
"valid_targets_min": 3135
|
|
},
|
|
{
|
|
"epoch": 6.7984496124031,
|
|
"grad_norm": 0.41715346551607424,
|
|
"learning_rate": 1.0251262096518499e-07,
|
|
"loss": 0.1402,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10508380830287933,
|
|
"step": 4385,
|
|
"valid_targets_mean": 4255.1,
|
|
"valid_targets_min": 250
|
|
},
|
|
{
|
|
"epoch": 6.8062015503875966,
|
|
"grad_norm": 0.5216272062569919,
|
|
"learning_rate": 9.484264237641372e-08,
|
|
"loss": 0.1549,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21273067593574524,
|
|
"step": 4390,
|
|
"valid_targets_mean": 4022.2,
|
|
"valid_targets_min": 608
|
|
},
|
|
{
|
|
"epoch": 6.813953488372093,
|
|
"grad_norm": 0.39630599414920137,
|
|
"learning_rate": 8.747018037488009e-08,
|
|
"loss": 0.1337,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12072727829217911,
|
|
"step": 4395,
|
|
"valid_targets_mean": 4854.1,
|
|
"valid_targets_min": 233
|
|
},
|
|
{
|
|
"epoch": 6.821705426356589,
|
|
"grad_norm": 0.4277418685702825,
|
|
"learning_rate": 8.039534515462244e-08,
|
|
"loss": 0.129,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11388542503118515,
|
|
"step": 4400,
|
|
"valid_targets_mean": 4361.8,
|
|
"valid_targets_min": 821
|
|
},
|
|
{
|
|
"epoch": 6.829457364341085,
|
|
"grad_norm": 0.38765433024613494,
|
|
"learning_rate": 7.361824246114424e-08,
|
|
"loss": 0.1309,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13917176425457,
|
|
"step": 4405,
|
|
"valid_targets_mean": 5343.9,
|
|
"valid_targets_min": 1942
|
|
},
|
|
{
|
|
"epoch": 6.837209302325581,
|
|
"grad_norm": 0.34398297746177137,
|
|
"learning_rate": 6.713897358982202e-08,
|
|
"loss": 0.1493,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.113133504986763,
|
|
"step": 4410,
|
|
"valid_targets_mean": 5645.0,
|
|
"valid_targets_min": 678
|
|
},
|
|
{
|
|
"epoch": 6.844961240310077,
|
|
"grad_norm": 0.48279011534912997,
|
|
"learning_rate": 6.095763538440214e-08,
|
|
"loss": 0.1492,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12714777886867523,
|
|
"step": 4415,
|
|
"valid_targets_mean": 3936.2,
|
|
"valid_targets_min": 216
|
|
},
|
|
{
|
|
"epoch": 6.852713178294573,
|
|
"grad_norm": 0.4180463055838533,
|
|
"learning_rate": 5.507432023554637e-08,
|
|
"loss": 0.1469,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1416483223438263,
|
|
"step": 4420,
|
|
"valid_targets_mean": 4545.9,
|
|
"valid_targets_min": 1037
|
|
},
|
|
{
|
|
"epoch": 6.8604651162790695,
|
|
"grad_norm": 0.4294181180018212,
|
|
"learning_rate": 4.948911607945084e-08,
|
|
"loss": 0.1531,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19967518746852875,
|
|
"step": 4425,
|
|
"valid_targets_mean": 5607.9,
|
|
"valid_targets_min": 615
|
|
},
|
|
{
|
|
"epoch": 6.868217054263566,
|
|
"grad_norm": 0.3477503979746384,
|
|
"learning_rate": 4.420210639653366e-08,
|
|
"loss": 0.1297,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1086292415857315,
|
|
"step": 4430,
|
|
"valid_targets_mean": 5510.9,
|
|
"valid_targets_min": 2659
|
|
},
|
|
{
|
|
"epoch": 6.875968992248062,
|
|
"grad_norm": 0.41768003376691165,
|
|
"learning_rate": 3.921337021018934e-08,
|
|
"loss": 0.1403,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1428183615207672,
|
|
"step": 4435,
|
|
"valid_targets_mean": 5068.1,
|
|
"valid_targets_min": 459
|
|
},
|
|
{
|
|
"epoch": 6.883720930232558,
|
|
"grad_norm": 0.490921604098694,
|
|
"learning_rate": 3.452298208560301e-08,
|
|
"loss": 0.1374,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17244720458984375,
|
|
"step": 4440,
|
|
"valid_targets_mean": 4010.2,
|
|
"valid_targets_min": 669
|
|
},
|
|
{
|
|
"epoch": 6.891472868217054,
|
|
"grad_norm": 0.36536468948119627,
|
|
"learning_rate": 3.0131012128642445e-08,
|
|
"loss": 0.1521,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11829351633787155,
|
|
"step": 4445,
|
|
"valid_targets_mean": 5238.6,
|
|
"valid_targets_min": 573
|
|
},
|
|
{
|
|
"epoch": 6.89922480620155,
|
|
"grad_norm": 0.43543485475431953,
|
|
"learning_rate": 2.6037525984798918e-08,
|
|
"loss": 0.1592,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14736925065517426,
|
|
"step": 4450,
|
|
"valid_targets_mean": 4508.6,
|
|
"valid_targets_min": 2594
|
|
},
|
|
{
|
|
"epoch": 6.906976744186046,
|
|
"grad_norm": 0.457191809542186,
|
|
"learning_rate": 2.2242584838219062e-08,
|
|
"loss": 0.1419,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1291424185037613,
|
|
"step": 4455,
|
|
"valid_targets_mean": 4140.1,
|
|
"valid_targets_min": 363
|
|
},
|
|
{
|
|
"epoch": 6.9147286821705425,
|
|
"grad_norm": 0.3441924236982618,
|
|
"learning_rate": 1.8746245410781184e-08,
|
|
"loss": 0.1402,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09382060170173645,
|
|
"step": 4460,
|
|
"valid_targets_mean": 5934.2,
|
|
"valid_targets_min": 2203
|
|
},
|
|
{
|
|
"epoch": 6.922480620155039,
|
|
"grad_norm": 0.46978533968904,
|
|
"learning_rate": 1.5548559961253707e-08,
|
|
"loss": 0.1517,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16701874136924744,
|
|
"step": 4465,
|
|
"valid_targets_mean": 4124.2,
|
|
"valid_targets_min": 435
|
|
},
|
|
{
|
|
"epoch": 6.930232558139535,
|
|
"grad_norm": 0.45884185400938543,
|
|
"learning_rate": 1.2649576284509135e-08,
|
|
"loss": 0.1654,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15522664785385132,
|
|
"step": 4470,
|
|
"valid_targets_mean": 4735.6,
|
|
"valid_targets_min": 748
|
|
},
|
|
{
|
|
"epoch": 6.937984496124031,
|
|
"grad_norm": 0.37304600716915987,
|
|
"learning_rate": 1.004933771080907e-08,
|
|
"loss": 0.1585,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15063238143920898,
|
|
"step": 4475,
|
|
"valid_targets_mean": 5812.3,
|
|
"valid_targets_min": 1844
|
|
},
|
|
{
|
|
"epoch": 6.945736434108527,
|
|
"grad_norm": 0.4417268532948254,
|
|
"learning_rate": 7.747883105166942e-09,
|
|
"loss": 0.1483,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12845158576965332,
|
|
"step": 4480,
|
|
"valid_targets_mean": 3979.6,
|
|
"valid_targets_min": 329
|
|
},
|
|
{
|
|
"epoch": 6.953488372093023,
|
|
"grad_norm": 0.4206373369632711,
|
|
"learning_rate": 5.745246866748489e-09,
|
|
"loss": 0.1433,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1285676211118698,
|
|
"step": 4485,
|
|
"valid_targets_mean": 4420.4,
|
|
"valid_targets_min": 864
|
|
},
|
|
{
|
|
"epoch": 6.961240310077519,
|
|
"grad_norm": 0.409189864441095,
|
|
"learning_rate": 4.041458928378816e-09,
|
|
"loss": 0.1433,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13274972140789032,
|
|
"step": 4490,
|
|
"valid_targets_mean": 5082.7,
|
|
"valid_targets_min": 2020
|
|
},
|
|
{
|
|
"epoch": 6.9689922480620154,
|
|
"grad_norm": 0.7633572465865676,
|
|
"learning_rate": 2.6365447560761093e-09,
|
|
"loss": 0.1471,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1332360953092575,
|
|
"step": 4495,
|
|
"valid_targets_mean": 3844.5,
|
|
"valid_targets_min": 300
|
|
},
|
|
{
|
|
"epoch": 6.976744186046512,
|
|
"grad_norm": 0.4810580142176617,
|
|
"learning_rate": 1.5305253486852523e-09,
|
|
"loss": 0.1431,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16817598044872284,
|
|
"step": 4500,
|
|
"valid_targets_mean": 4177.8,
|
|
"valid_targets_min": 529
|
|
},
|
|
{
|
|
"epoch": 6.984496124031008,
|
|
"grad_norm": 0.4276342091229402,
|
|
"learning_rate": 7.234172375558679e-10,
|
|
"loss": 0.1495,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13658341765403748,
|
|
"step": 4505,
|
|
"valid_targets_mean": 4540.3,
|
|
"valid_targets_min": 1720
|
|
},
|
|
{
|
|
"epoch": 6.992248062015504,
|
|
"grad_norm": 0.41945236764032184,
|
|
"learning_rate": 2.1523248629806703e-10,
|
|
"loss": 0.1521,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14896142482757568,
|
|
"step": 4510,
|
|
"valid_targets_mean": 4939.6,
|
|
"valid_targets_min": 694
|
|
},
|
|
{
|
|
"epoch": 7.0,
|
|
"grad_norm": 0.4017760557242996,
|
|
"learning_rate": 5.978690600372261e-12,
|
|
"loss": 0.1386,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12985655665397644,
|
|
"step": 4515,
|
|
"valid_targets_mean": 5961.6,
|
|
"valid_targets_min": 2002
|
|
},
|
|
{
|
|
"epoch": 7.0,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12985655665397644,
|
|
"step": 4515,
|
|
"total_flos": 1219521762033664.0,
|
|
"train_loss": 0.10701951415567831,
|
|
"train_runtime": 13204.5072,
|
|
"train_samples_per_second": 5.464,
|
|
"train_steps_per_second": 0.342,
|
|
"valid_targets_mean": 5961.6,
|
|
"valid_targets_min": 2002
|
|
}
|
|
],
|
|
"logging_steps": 5,
|
|
"max_steps": 4515,
|
|
"num_input_tokens_seen": 0,
|
|
"num_train_epochs": 7,
|
|
"save_steps": 1500,
|
|
"stateful_callbacks": {
|
|
"TrainerControl": {
|
|
"args": {
|
|
"should_epoch_stop": false,
|
|
"should_evaluate": false,
|
|
"should_log": false,
|
|
"should_save": true,
|
|
"should_training_stop": true
|
|
},
|
|
"attributes": {}
|
|
}
|
|
},
|
|
"total_flos": 1219521762033664.0,
|
|
"train_batch_size": 1,
|
|
"trial_name": null,
|
|
"trial_params": null
|
|
}
|