10641 lines
295 KiB
JSON
10641 lines
295 KiB
JSON
{
|
|
"best_global_step": null,
|
|
"best_metric": null,
|
|
"best_model_checkpoint": null,
|
|
"epoch": 7.0,
|
|
"eval_steps": 500,
|
|
"global_step": 4816,
|
|
"is_hyper_param_search": false,
|
|
"is_local_process_zero": true,
|
|
"is_world_process_zero": true,
|
|
"log_history": [
|
|
{
|
|
"epoch": 0.007267441860465116,
|
|
"grad_norm": 23.60395367303308,
|
|
"learning_rate": 3.319502074688797e-07,
|
|
"loss": 0.8619,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.36206579208374023,
|
|
"step": 5,
|
|
"valid_targets_mean": 3788.0,
|
|
"valid_targets_min": 735
|
|
},
|
|
{
|
|
"epoch": 0.014534883720930232,
|
|
"grad_norm": 23.282874067744043,
|
|
"learning_rate": 7.468879668049793e-07,
|
|
"loss": 0.88,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.34413787722587585,
|
|
"step": 10,
|
|
"valid_targets_mean": 3052.0,
|
|
"valid_targets_min": 514
|
|
},
|
|
{
|
|
"epoch": 0.02180232558139535,
|
|
"grad_norm": 20.544843116221944,
|
|
"learning_rate": 1.161825726141079e-06,
|
|
"loss": 0.8461,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.37611252069473267,
|
|
"step": 15,
|
|
"valid_targets_mean": 4375.6,
|
|
"valid_targets_min": 629
|
|
},
|
|
{
|
|
"epoch": 0.029069767441860465,
|
|
"grad_norm": 15.377437328665666,
|
|
"learning_rate": 1.5767634854771784e-06,
|
|
"loss": 0.7898,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.3731459975242615,
|
|
"step": 20,
|
|
"valid_targets_mean": 5467.6,
|
|
"valid_targets_min": 3940
|
|
},
|
|
{
|
|
"epoch": 0.036337209302325583,
|
|
"grad_norm": 9.747878208294727,
|
|
"learning_rate": 1.991701244813278e-06,
|
|
"loss": 0.7522,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.41458815336227417,
|
|
"step": 25,
|
|
"valid_targets_mean": 3558.1,
|
|
"valid_targets_min": 703
|
|
},
|
|
{
|
|
"epoch": 0.0436046511627907,
|
|
"grad_norm": 5.1933038029969305,
|
|
"learning_rate": 2.4066390041493776e-06,
|
|
"loss": 0.6776,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.32391414046287537,
|
|
"step": 30,
|
|
"valid_targets_mean": 2797.5,
|
|
"valid_targets_min": 758
|
|
},
|
|
{
|
|
"epoch": 0.050872093023255814,
|
|
"grad_norm": 2.9153373109793437,
|
|
"learning_rate": 2.8215767634854773e-06,
|
|
"loss": 0.647,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.35981929302215576,
|
|
"step": 35,
|
|
"valid_targets_mean": 4440.8,
|
|
"valid_targets_min": 874
|
|
},
|
|
{
|
|
"epoch": 0.05813953488372093,
|
|
"grad_norm": 1.9464734332413474,
|
|
"learning_rate": 3.2365145228215773e-06,
|
|
"loss": 0.6368,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.297600120306015,
|
|
"step": 40,
|
|
"valid_targets_mean": 4015.2,
|
|
"valid_targets_min": 623
|
|
},
|
|
{
|
|
"epoch": 0.06540697674418605,
|
|
"grad_norm": 1.5811509244863968,
|
|
"learning_rate": 3.6514522821576765e-06,
|
|
"loss": 0.6042,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.235577791929245,
|
|
"step": 45,
|
|
"valid_targets_mean": 3494.8,
|
|
"valid_targets_min": 676
|
|
},
|
|
{
|
|
"epoch": 0.07267441860465117,
|
|
"grad_norm": 1.6191035025819336,
|
|
"learning_rate": 4.0663900414937765e-06,
|
|
"loss": 0.6092,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.3790181875228882,
|
|
"step": 50,
|
|
"valid_targets_mean": 2875.0,
|
|
"valid_targets_min": 743
|
|
},
|
|
{
|
|
"epoch": 0.07994186046511628,
|
|
"grad_norm": 1.2139651902387136,
|
|
"learning_rate": 4.481327800829876e-06,
|
|
"loss": 0.5623,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23523655533790588,
|
|
"step": 55,
|
|
"valid_targets_mean": 2952.5,
|
|
"valid_targets_min": 634
|
|
},
|
|
{
|
|
"epoch": 0.0872093023255814,
|
|
"grad_norm": 1.107547629402263,
|
|
"learning_rate": 4.896265560165976e-06,
|
|
"loss": 0.5582,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24975699186325073,
|
|
"step": 60,
|
|
"valid_targets_mean": 2733.1,
|
|
"valid_targets_min": 557
|
|
},
|
|
{
|
|
"epoch": 0.09447674418604651,
|
|
"grad_norm": 0.8171060334267412,
|
|
"learning_rate": 5.311203319502075e-06,
|
|
"loss": 0.5279,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2179132103919983,
|
|
"step": 65,
|
|
"valid_targets_mean": 3514.1,
|
|
"valid_targets_min": 728
|
|
},
|
|
{
|
|
"epoch": 0.10174418604651163,
|
|
"grad_norm": 0.8445616203520336,
|
|
"learning_rate": 5.726141078838174e-06,
|
|
"loss": 0.5329,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22933122515678406,
|
|
"step": 70,
|
|
"valid_targets_mean": 2726.6,
|
|
"valid_targets_min": 615
|
|
},
|
|
{
|
|
"epoch": 0.10901162790697674,
|
|
"grad_norm": 0.7363370039191905,
|
|
"learning_rate": 6.1410788381742745e-06,
|
|
"loss": 0.4821,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2222234010696411,
|
|
"step": 75,
|
|
"valid_targets_mean": 4008.4,
|
|
"valid_targets_min": 580
|
|
},
|
|
{
|
|
"epoch": 0.11627906976744186,
|
|
"grad_norm": 0.6626607153866264,
|
|
"learning_rate": 6.556016597510374e-06,
|
|
"loss": 0.4768,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1906505525112152,
|
|
"step": 80,
|
|
"valid_targets_mean": 4183.4,
|
|
"valid_targets_min": 560
|
|
},
|
|
{
|
|
"epoch": 0.12354651162790697,
|
|
"grad_norm": 0.7275647245598297,
|
|
"learning_rate": 6.970954356846473e-06,
|
|
"loss": 0.4808,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23446953296661377,
|
|
"step": 85,
|
|
"valid_targets_mean": 4184.1,
|
|
"valid_targets_min": 527
|
|
},
|
|
{
|
|
"epoch": 0.1308139534883721,
|
|
"grad_norm": 0.6302365183817711,
|
|
"learning_rate": 7.385892116182573e-06,
|
|
"loss": 0.4469,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22797903418540955,
|
|
"step": 90,
|
|
"valid_targets_mean": 5058.5,
|
|
"valid_targets_min": 3750
|
|
},
|
|
{
|
|
"epoch": 0.1380813953488372,
|
|
"grad_norm": 0.6928723527565587,
|
|
"learning_rate": 7.800829875518673e-06,
|
|
"loss": 0.4533,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23440513014793396,
|
|
"step": 95,
|
|
"valid_targets_mean": 3689.2,
|
|
"valid_targets_min": 713
|
|
},
|
|
{
|
|
"epoch": 0.14534883720930233,
|
|
"grad_norm": 0.9242860696284508,
|
|
"learning_rate": 8.215767634854772e-06,
|
|
"loss": 0.4457,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24846482276916504,
|
|
"step": 100,
|
|
"valid_targets_mean": 3255.8,
|
|
"valid_targets_min": 597
|
|
},
|
|
{
|
|
"epoch": 0.15261627906976744,
|
|
"grad_norm": 0.6413774191381949,
|
|
"learning_rate": 8.630705394190872e-06,
|
|
"loss": 0.4474,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19246378540992737,
|
|
"step": 105,
|
|
"valid_targets_mean": 3996.2,
|
|
"valid_targets_min": 632
|
|
},
|
|
{
|
|
"epoch": 0.15988372093023256,
|
|
"grad_norm": 0.6894681865347022,
|
|
"learning_rate": 9.045643153526971e-06,
|
|
"loss": 0.4288,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19999036192893982,
|
|
"step": 110,
|
|
"valid_targets_mean": 3380.1,
|
|
"valid_targets_min": 629
|
|
},
|
|
{
|
|
"epoch": 0.16715116279069767,
|
|
"grad_norm": 0.7022454218409497,
|
|
"learning_rate": 9.460580912863071e-06,
|
|
"loss": 0.4541,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16242238879203796,
|
|
"step": 115,
|
|
"valid_targets_mean": 3007.4,
|
|
"valid_targets_min": 712
|
|
},
|
|
{
|
|
"epoch": 0.1744186046511628,
|
|
"grad_norm": 0.6253461021305736,
|
|
"learning_rate": 9.875518672199172e-06,
|
|
"loss": 0.4304,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14945435523986816,
|
|
"step": 120,
|
|
"valid_targets_mean": 3177.5,
|
|
"valid_targets_min": 819
|
|
},
|
|
{
|
|
"epoch": 0.1816860465116279,
|
|
"grad_norm": 0.7018027456233442,
|
|
"learning_rate": 1.0290456431535269e-05,
|
|
"loss": 0.41,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17015759646892548,
|
|
"step": 125,
|
|
"valid_targets_mean": 2437.5,
|
|
"valid_targets_min": 339
|
|
},
|
|
{
|
|
"epoch": 0.18895348837209303,
|
|
"grad_norm": 0.8319196430142065,
|
|
"learning_rate": 1.070539419087137e-05,
|
|
"loss": 0.4158,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.206083744764328,
|
|
"step": 130,
|
|
"valid_targets_mean": 3995.8,
|
|
"valid_targets_min": 667
|
|
},
|
|
{
|
|
"epoch": 0.19622093023255813,
|
|
"grad_norm": 0.5700530676300132,
|
|
"learning_rate": 1.112033195020747e-05,
|
|
"loss": 0.3866,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23243868350982666,
|
|
"step": 135,
|
|
"valid_targets_mean": 5856.1,
|
|
"valid_targets_min": 3495
|
|
},
|
|
{
|
|
"epoch": 0.20348837209302326,
|
|
"grad_norm": 0.7259992884453891,
|
|
"learning_rate": 1.1535269709543569e-05,
|
|
"loss": 0.3935,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19784843921661377,
|
|
"step": 140,
|
|
"valid_targets_mean": 2655.4,
|
|
"valid_targets_min": 612
|
|
},
|
|
{
|
|
"epoch": 0.21075581395348839,
|
|
"grad_norm": 0.5805199736360525,
|
|
"learning_rate": 1.1950207468879669e-05,
|
|
"loss": 0.3836,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17293311655521393,
|
|
"step": 145,
|
|
"valid_targets_mean": 4135.4,
|
|
"valid_targets_min": 855
|
|
},
|
|
{
|
|
"epoch": 0.2180232558139535,
|
|
"grad_norm": 0.7106827535386514,
|
|
"learning_rate": 1.236514522821577e-05,
|
|
"loss": 0.3918,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2059229165315628,
|
|
"step": 150,
|
|
"valid_targets_mean": 4109.1,
|
|
"valid_targets_min": 1018
|
|
},
|
|
{
|
|
"epoch": 0.22529069767441862,
|
|
"grad_norm": 0.6454809853641186,
|
|
"learning_rate": 1.2780082987551867e-05,
|
|
"loss": 0.3847,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16915945708751678,
|
|
"step": 155,
|
|
"valid_targets_mean": 3834.5,
|
|
"valid_targets_min": 429
|
|
},
|
|
{
|
|
"epoch": 0.23255813953488372,
|
|
"grad_norm": 0.7811620851477677,
|
|
"learning_rate": 1.3195020746887967e-05,
|
|
"loss": 0.387,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17152553796768188,
|
|
"step": 160,
|
|
"valid_targets_mean": 2061.4,
|
|
"valid_targets_min": 572
|
|
},
|
|
{
|
|
"epoch": 0.23982558139534885,
|
|
"grad_norm": 0.6473284356559537,
|
|
"learning_rate": 1.3609958506224067e-05,
|
|
"loss": 0.3834,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16540473699569702,
|
|
"step": 165,
|
|
"valid_targets_mean": 3449.9,
|
|
"valid_targets_min": 512
|
|
},
|
|
{
|
|
"epoch": 0.24709302325581395,
|
|
"grad_norm": 0.6625475101770146,
|
|
"learning_rate": 1.4024896265560166e-05,
|
|
"loss": 0.3975,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19903941452503204,
|
|
"step": 170,
|
|
"valid_targets_mean": 4140.4,
|
|
"valid_targets_min": 677
|
|
},
|
|
{
|
|
"epoch": 0.2543604651162791,
|
|
"grad_norm": 0.6564466177734336,
|
|
"learning_rate": 1.4439834024896267e-05,
|
|
"loss": 0.3808,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14273467659950256,
|
|
"step": 175,
|
|
"valid_targets_mean": 2623.4,
|
|
"valid_targets_min": 717
|
|
},
|
|
{
|
|
"epoch": 0.2616279069767442,
|
|
"grad_norm": 0.7554600141788899,
|
|
"learning_rate": 1.4854771784232367e-05,
|
|
"loss": 0.3775,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19581112265586853,
|
|
"step": 180,
|
|
"valid_targets_mean": 3290.1,
|
|
"valid_targets_min": 594
|
|
},
|
|
{
|
|
"epoch": 0.2688953488372093,
|
|
"grad_norm": 0.8137765108506549,
|
|
"learning_rate": 1.5269709543568464e-05,
|
|
"loss": 0.3938,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20833677053451538,
|
|
"step": 185,
|
|
"valid_targets_mean": 2977.4,
|
|
"valid_targets_min": 789
|
|
},
|
|
{
|
|
"epoch": 0.2761627906976744,
|
|
"grad_norm": 0.819634775218101,
|
|
"learning_rate": 1.5684647302904566e-05,
|
|
"loss": 0.383,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2356613427400589,
|
|
"step": 190,
|
|
"valid_targets_mean": 3226.0,
|
|
"valid_targets_min": 659
|
|
},
|
|
{
|
|
"epoch": 0.28343023255813954,
|
|
"grad_norm": 0.6515391834585635,
|
|
"learning_rate": 1.6099585062240665e-05,
|
|
"loss": 0.3812,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.171596497297287,
|
|
"step": 195,
|
|
"valid_targets_mean": 3689.6,
|
|
"valid_targets_min": 638
|
|
},
|
|
{
|
|
"epoch": 0.29069767441860467,
|
|
"grad_norm": 0.6568499242368925,
|
|
"learning_rate": 1.6514522821576764e-05,
|
|
"loss": 0.3761,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1820891797542572,
|
|
"step": 200,
|
|
"valid_targets_mean": 3843.2,
|
|
"valid_targets_min": 631
|
|
},
|
|
{
|
|
"epoch": 0.29796511627906974,
|
|
"grad_norm": 0.7472077453103736,
|
|
"learning_rate": 1.6929460580912863e-05,
|
|
"loss": 0.3862,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2648097276687622,
|
|
"step": 205,
|
|
"valid_targets_mean": 3722.5,
|
|
"valid_targets_min": 666
|
|
},
|
|
{
|
|
"epoch": 0.30523255813953487,
|
|
"grad_norm": 0.877924169905687,
|
|
"learning_rate": 1.7344398340248965e-05,
|
|
"loss": 0.373,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.24992845952510834,
|
|
"step": 210,
|
|
"valid_targets_mean": 2855.9,
|
|
"valid_targets_min": 506
|
|
},
|
|
{
|
|
"epoch": 0.3125,
|
|
"grad_norm": 0.8416781774626408,
|
|
"learning_rate": 1.7759336099585064e-05,
|
|
"loss": 0.3787,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22990360856056213,
|
|
"step": 215,
|
|
"valid_targets_mean": 3118.4,
|
|
"valid_targets_min": 800
|
|
},
|
|
{
|
|
"epoch": 0.31976744186046513,
|
|
"grad_norm": 0.6566273438654435,
|
|
"learning_rate": 1.8174273858921162e-05,
|
|
"loss": 0.3952,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14994342625141144,
|
|
"step": 220,
|
|
"valid_targets_mean": 3124.2,
|
|
"valid_targets_min": 572
|
|
},
|
|
{
|
|
"epoch": 0.32703488372093026,
|
|
"grad_norm": 0.6550126195062852,
|
|
"learning_rate": 1.8589211618257264e-05,
|
|
"loss": 0.3555,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1906970590353012,
|
|
"step": 225,
|
|
"valid_targets_mean": 3964.2,
|
|
"valid_targets_min": 954
|
|
},
|
|
{
|
|
"epoch": 0.33430232558139533,
|
|
"grad_norm": 0.6948624664412582,
|
|
"learning_rate": 1.9004149377593363e-05,
|
|
"loss": 0.3649,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2098342776298523,
|
|
"step": 230,
|
|
"valid_targets_mean": 3855.0,
|
|
"valid_targets_min": 297
|
|
},
|
|
{
|
|
"epoch": 0.34156976744186046,
|
|
"grad_norm": 0.694830010463169,
|
|
"learning_rate": 1.9419087136929462e-05,
|
|
"loss": 0.3644,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2014472782611847,
|
|
"step": 235,
|
|
"valid_targets_mean": 4444.5,
|
|
"valid_targets_min": 559
|
|
},
|
|
{
|
|
"epoch": 0.3488372093023256,
|
|
"grad_norm": 0.7125029122579649,
|
|
"learning_rate": 1.983402489626556e-05,
|
|
"loss": 0.3588,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1556605100631714,
|
|
"step": 240,
|
|
"valid_targets_mean": 3346.0,
|
|
"valid_targets_min": 516
|
|
},
|
|
{
|
|
"epoch": 0.3561046511627907,
|
|
"grad_norm": 0.6714853403607605,
|
|
"learning_rate": 2.024896265560166e-05,
|
|
"loss": 0.3635,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19688832759857178,
|
|
"step": 245,
|
|
"valid_targets_mean": 4349.2,
|
|
"valid_targets_min": 694
|
|
},
|
|
{
|
|
"epoch": 0.3633720930232558,
|
|
"grad_norm": 0.6799567905357822,
|
|
"learning_rate": 2.066390041493776e-05,
|
|
"loss": 0.3641,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14497721195220947,
|
|
"step": 250,
|
|
"valid_targets_mean": 3314.5,
|
|
"valid_targets_min": 803
|
|
},
|
|
{
|
|
"epoch": 0.3706395348837209,
|
|
"grad_norm": 0.7202375378999366,
|
|
"learning_rate": 2.107883817427386e-05,
|
|
"loss": 0.3509,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18096783757209778,
|
|
"step": 255,
|
|
"valid_targets_mean": 3134.6,
|
|
"valid_targets_min": 562
|
|
},
|
|
{
|
|
"epoch": 0.37790697674418605,
|
|
"grad_norm": 0.6155035214731711,
|
|
"learning_rate": 2.149377593360996e-05,
|
|
"loss": 0.3543,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1524481177330017,
|
|
"step": 260,
|
|
"valid_targets_mean": 3271.9,
|
|
"valid_targets_min": 305
|
|
},
|
|
{
|
|
"epoch": 0.3851744186046512,
|
|
"grad_norm": 0.6335191320342396,
|
|
"learning_rate": 2.190871369294606e-05,
|
|
"loss": 0.3378,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19276472926139832,
|
|
"step": 265,
|
|
"valid_targets_mean": 4571.8,
|
|
"valid_targets_min": 805
|
|
},
|
|
{
|
|
"epoch": 0.39244186046511625,
|
|
"grad_norm": 0.6827322142507465,
|
|
"learning_rate": 2.232365145228216e-05,
|
|
"loss": 0.3526,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18056687712669373,
|
|
"step": 270,
|
|
"valid_targets_mean": 3713.2,
|
|
"valid_targets_min": 576
|
|
},
|
|
{
|
|
"epoch": 0.3997093023255814,
|
|
"grad_norm": 0.6937020874439587,
|
|
"learning_rate": 2.273858921161826e-05,
|
|
"loss": 0.3786,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19584697484970093,
|
|
"step": 275,
|
|
"valid_targets_mean": 4246.0,
|
|
"valid_targets_min": 632
|
|
},
|
|
{
|
|
"epoch": 0.4069767441860465,
|
|
"grad_norm": 0.7507183101664987,
|
|
"learning_rate": 2.315352697095436e-05,
|
|
"loss": 0.3594,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16600695252418518,
|
|
"step": 280,
|
|
"valid_targets_mean": 2664.1,
|
|
"valid_targets_min": 704
|
|
},
|
|
{
|
|
"epoch": 0.41424418604651164,
|
|
"grad_norm": 0.6156181535415471,
|
|
"learning_rate": 2.356846473029046e-05,
|
|
"loss": 0.3452,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1752406358718872,
|
|
"step": 285,
|
|
"valid_targets_mean": 3996.6,
|
|
"valid_targets_min": 540
|
|
},
|
|
{
|
|
"epoch": 0.42151162790697677,
|
|
"grad_norm": 0.6532054067762535,
|
|
"learning_rate": 2.398340248962656e-05,
|
|
"loss": 0.3384,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15145818889141083,
|
|
"step": 290,
|
|
"valid_targets_mean": 4135.5,
|
|
"valid_targets_min": 799
|
|
},
|
|
{
|
|
"epoch": 0.42877906976744184,
|
|
"grad_norm": 0.6821518031591993,
|
|
"learning_rate": 2.439834024896266e-05,
|
|
"loss": 0.3506,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13307440280914307,
|
|
"step": 295,
|
|
"valid_targets_mean": 2559.9,
|
|
"valid_targets_min": 770
|
|
},
|
|
{
|
|
"epoch": 0.436046511627907,
|
|
"grad_norm": 0.6168836807757696,
|
|
"learning_rate": 2.481327800829876e-05,
|
|
"loss": 0.3305,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1336684226989746,
|
|
"step": 300,
|
|
"valid_targets_mean": 3724.6,
|
|
"valid_targets_min": 650
|
|
},
|
|
{
|
|
"epoch": 0.4433139534883721,
|
|
"grad_norm": 0.7333001387424685,
|
|
"learning_rate": 2.5228215767634855e-05,
|
|
"loss": 0.3556,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15666671097278595,
|
|
"step": 305,
|
|
"valid_targets_mean": 2321.0,
|
|
"valid_targets_min": 867
|
|
},
|
|
{
|
|
"epoch": 0.45058139534883723,
|
|
"grad_norm": 0.6581684280891332,
|
|
"learning_rate": 2.5643153526970957e-05,
|
|
"loss": 0.3537,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17739339172840118,
|
|
"step": 310,
|
|
"valid_targets_mean": 3477.4,
|
|
"valid_targets_min": 552
|
|
},
|
|
{
|
|
"epoch": 0.4578488372093023,
|
|
"grad_norm": 0.6691702027150105,
|
|
"learning_rate": 2.6058091286307056e-05,
|
|
"loss": 0.3433,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14868199825286865,
|
|
"step": 315,
|
|
"valid_targets_mean": 2954.4,
|
|
"valid_targets_min": 571
|
|
},
|
|
{
|
|
"epoch": 0.46511627906976744,
|
|
"grad_norm": 0.7240436681213814,
|
|
"learning_rate": 2.6473029045643155e-05,
|
|
"loss": 0.3346,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19649548828601837,
|
|
"step": 320,
|
|
"valid_targets_mean": 3651.5,
|
|
"valid_targets_min": 649
|
|
},
|
|
{
|
|
"epoch": 0.47238372093023256,
|
|
"grad_norm": 0.6691805651498327,
|
|
"learning_rate": 2.6887966804979257e-05,
|
|
"loss": 0.3331,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18201938271522522,
|
|
"step": 325,
|
|
"valid_targets_mean": 4133.5,
|
|
"valid_targets_min": 625
|
|
},
|
|
{
|
|
"epoch": 0.4796511627906977,
|
|
"grad_norm": 0.6386940655448596,
|
|
"learning_rate": 2.7302904564315355e-05,
|
|
"loss": 0.3464,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17419925332069397,
|
|
"step": 330,
|
|
"valid_targets_mean": 4157.8,
|
|
"valid_targets_min": 790
|
|
},
|
|
{
|
|
"epoch": 0.48691860465116277,
|
|
"grad_norm": 0.592600128740923,
|
|
"learning_rate": 2.7717842323651454e-05,
|
|
"loss": 0.3464,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.23807524144649506,
|
|
"step": 335,
|
|
"valid_targets_mean": 6100.8,
|
|
"valid_targets_min": 4148
|
|
},
|
|
{
|
|
"epoch": 0.4941860465116279,
|
|
"grad_norm": 0.6395879958003222,
|
|
"learning_rate": 2.8132780082987556e-05,
|
|
"loss": 0.3426,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11755307763814926,
|
|
"step": 340,
|
|
"valid_targets_mean": 2526.9,
|
|
"valid_targets_min": 564
|
|
},
|
|
{
|
|
"epoch": 0.501453488372093,
|
|
"grad_norm": 0.7373583172871605,
|
|
"learning_rate": 2.8547717842323655e-05,
|
|
"loss": 0.3435,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18158669769763947,
|
|
"step": 345,
|
|
"valid_targets_mean": 3016.9,
|
|
"valid_targets_min": 663
|
|
},
|
|
{
|
|
"epoch": 0.5087209302325582,
|
|
"grad_norm": 0.6359067322988392,
|
|
"learning_rate": 2.8962655601659754e-05,
|
|
"loss": 0.3442,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13962212204933167,
|
|
"step": 350,
|
|
"valid_targets_mean": 3866.6,
|
|
"valid_targets_min": 602
|
|
},
|
|
{
|
|
"epoch": 0.5159883720930233,
|
|
"grad_norm": 0.6292053753904882,
|
|
"learning_rate": 2.9377593360995856e-05,
|
|
"loss": 0.3168,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13878588378429413,
|
|
"step": 355,
|
|
"valid_targets_mean": 2948.9,
|
|
"valid_targets_min": 632
|
|
},
|
|
{
|
|
"epoch": 0.5232558139534884,
|
|
"grad_norm": 0.6465028968729859,
|
|
"learning_rate": 2.9792531120331955e-05,
|
|
"loss": 0.3223,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15605293214321136,
|
|
"step": 360,
|
|
"valid_targets_mean": 2838.6,
|
|
"valid_targets_min": 550
|
|
},
|
|
{
|
|
"epoch": 0.5305232558139535,
|
|
"grad_norm": 0.599120544848729,
|
|
"learning_rate": 3.020746887966805e-05,
|
|
"loss": 0.3301,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19232279062271118,
|
|
"step": 365,
|
|
"valid_targets_mean": 5084.5,
|
|
"valid_targets_min": 3708
|
|
},
|
|
{
|
|
"epoch": 0.5377906976744186,
|
|
"grad_norm": 0.6008656846497219,
|
|
"learning_rate": 3.062240663900415e-05,
|
|
"loss": 0.3372,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18847373127937317,
|
|
"step": 370,
|
|
"valid_targets_mean": 4938.4,
|
|
"valid_targets_min": 912
|
|
},
|
|
{
|
|
"epoch": 0.5450581395348837,
|
|
"grad_norm": 0.6285704558404371,
|
|
"learning_rate": 3.103734439834025e-05,
|
|
"loss": 0.3402,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.170862078666687,
|
|
"step": 375,
|
|
"valid_targets_mean": 3930.4,
|
|
"valid_targets_min": 980
|
|
},
|
|
{
|
|
"epoch": 0.5523255813953488,
|
|
"grad_norm": 0.631234804649969,
|
|
"learning_rate": 3.145228215767635e-05,
|
|
"loss": 0.3012,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12571334838867188,
|
|
"step": 380,
|
|
"valid_targets_mean": 3135.5,
|
|
"valid_targets_min": 663
|
|
},
|
|
{
|
|
"epoch": 0.559593023255814,
|
|
"grad_norm": 0.6821774303746879,
|
|
"learning_rate": 3.186721991701245e-05,
|
|
"loss": 0.3193,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14924553036689758,
|
|
"step": 385,
|
|
"valid_targets_mean": 3077.9,
|
|
"valid_targets_min": 545
|
|
},
|
|
{
|
|
"epoch": 0.5668604651162791,
|
|
"grad_norm": 0.9548135178922332,
|
|
"learning_rate": 3.2282157676348554e-05,
|
|
"loss": 0.3267,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13922418653964996,
|
|
"step": 390,
|
|
"valid_targets_mean": 2856.1,
|
|
"valid_targets_min": 603
|
|
},
|
|
{
|
|
"epoch": 0.5741279069767442,
|
|
"grad_norm": 0.6667391470008851,
|
|
"learning_rate": 3.2697095435684646e-05,
|
|
"loss": 0.3223,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1518375724554062,
|
|
"step": 395,
|
|
"valid_targets_mean": 3825.0,
|
|
"valid_targets_min": 563
|
|
},
|
|
{
|
|
"epoch": 0.5813953488372093,
|
|
"grad_norm": 0.7530532693129081,
|
|
"learning_rate": 3.3112033195020745e-05,
|
|
"loss": 0.3517,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16733457148075104,
|
|
"step": 400,
|
|
"valid_targets_mean": 3029.6,
|
|
"valid_targets_min": 657
|
|
},
|
|
{
|
|
"epoch": 0.5886627906976745,
|
|
"grad_norm": 0.6663888895860358,
|
|
"learning_rate": 3.352697095435685e-05,
|
|
"loss": 0.3137,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14393126964569092,
|
|
"step": 405,
|
|
"valid_targets_mean": 4312.1,
|
|
"valid_targets_min": 780
|
|
},
|
|
{
|
|
"epoch": 0.5959302325581395,
|
|
"grad_norm": 0.6660172981348241,
|
|
"learning_rate": 3.394190871369295e-05,
|
|
"loss": 0.326,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1679423302412033,
|
|
"step": 410,
|
|
"valid_targets_mean": 3628.2,
|
|
"valid_targets_min": 525
|
|
},
|
|
{
|
|
"epoch": 0.6031976744186046,
|
|
"grad_norm": 0.5769438912613716,
|
|
"learning_rate": 3.435684647302905e-05,
|
|
"loss": 0.3415,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13888345658779144,
|
|
"step": 415,
|
|
"valid_targets_mean": 2948.0,
|
|
"valid_targets_min": 629
|
|
},
|
|
{
|
|
"epoch": 0.6104651162790697,
|
|
"grad_norm": 0.6552132927034705,
|
|
"learning_rate": 3.477178423236515e-05,
|
|
"loss": 0.3226,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1582183837890625,
|
|
"step": 420,
|
|
"valid_targets_mean": 3943.6,
|
|
"valid_targets_min": 805
|
|
},
|
|
{
|
|
"epoch": 0.6177325581395349,
|
|
"grad_norm": 0.605802257570494,
|
|
"learning_rate": 3.5186721991701245e-05,
|
|
"loss": 0.3392,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1685292273759842,
|
|
"step": 425,
|
|
"valid_targets_mean": 3261.0,
|
|
"valid_targets_min": 853
|
|
},
|
|
{
|
|
"epoch": 0.625,
|
|
"grad_norm": 0.6087478907133542,
|
|
"learning_rate": 3.5601659751037344e-05,
|
|
"loss": 0.3293,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1881280243396759,
|
|
"step": 430,
|
|
"valid_targets_mean": 4309.2,
|
|
"valid_targets_min": 729
|
|
},
|
|
{
|
|
"epoch": 0.6322674418604651,
|
|
"grad_norm": 0.7473680581058674,
|
|
"learning_rate": 3.601659751037345e-05,
|
|
"loss": 0.3198,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1361180990934372,
|
|
"step": 435,
|
|
"valid_targets_mean": 3453.4,
|
|
"valid_targets_min": 662
|
|
},
|
|
{
|
|
"epoch": 0.6395348837209303,
|
|
"grad_norm": 0.6504764288016779,
|
|
"learning_rate": 3.643153526970955e-05,
|
|
"loss": 0.3107,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1473781168460846,
|
|
"step": 440,
|
|
"valid_targets_mean": 3510.0,
|
|
"valid_targets_min": 490
|
|
},
|
|
{
|
|
"epoch": 0.6468023255813954,
|
|
"grad_norm": 0.7669144042878424,
|
|
"learning_rate": 3.684647302904565e-05,
|
|
"loss": 0.3209,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2131597101688385,
|
|
"step": 445,
|
|
"valid_targets_mean": 3796.1,
|
|
"valid_targets_min": 476
|
|
},
|
|
{
|
|
"epoch": 0.6540697674418605,
|
|
"grad_norm": 0.6403304907544071,
|
|
"learning_rate": 3.7261410788381746e-05,
|
|
"loss": 0.3323,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14401483535766602,
|
|
"step": 450,
|
|
"valid_targets_mean": 3364.4,
|
|
"valid_targets_min": 655
|
|
},
|
|
{
|
|
"epoch": 0.6613372093023255,
|
|
"grad_norm": 0.645985011133752,
|
|
"learning_rate": 3.7676348547717845e-05,
|
|
"loss": 0.3105,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.136003777384758,
|
|
"step": 455,
|
|
"valid_targets_mean": 2819.6,
|
|
"valid_targets_min": 687
|
|
},
|
|
{
|
|
"epoch": 0.6686046511627907,
|
|
"grad_norm": 0.7585240879141193,
|
|
"learning_rate": 3.8091286307053944e-05,
|
|
"loss": 0.3301,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1501508355140686,
|
|
"step": 460,
|
|
"valid_targets_mean": 3316.0,
|
|
"valid_targets_min": 693
|
|
},
|
|
{
|
|
"epoch": 0.6758720930232558,
|
|
"grad_norm": 0.7281883856779292,
|
|
"learning_rate": 3.850622406639004e-05,
|
|
"loss": 0.3154,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18056277930736542,
|
|
"step": 465,
|
|
"valid_targets_mean": 3833.4,
|
|
"valid_targets_min": 740
|
|
},
|
|
{
|
|
"epoch": 0.6831395348837209,
|
|
"grad_norm": 0.6535897957871524,
|
|
"learning_rate": 3.892116182572614e-05,
|
|
"loss": 0.3254,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.156234472990036,
|
|
"step": 470,
|
|
"valid_targets_mean": 3719.0,
|
|
"valid_targets_min": 824
|
|
},
|
|
{
|
|
"epoch": 0.690406976744186,
|
|
"grad_norm": 0.6187781320054627,
|
|
"learning_rate": 3.933609958506224e-05,
|
|
"loss": 0.3074,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14327925443649292,
|
|
"step": 475,
|
|
"valid_targets_mean": 3327.1,
|
|
"valid_targets_min": 667
|
|
},
|
|
{
|
|
"epoch": 0.6976744186046512,
|
|
"grad_norm": 0.6409941888826423,
|
|
"learning_rate": 3.9751037344398345e-05,
|
|
"loss": 0.3266,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18486058712005615,
|
|
"step": 480,
|
|
"valid_targets_mean": 4941.5,
|
|
"valid_targets_min": 729
|
|
},
|
|
{
|
|
"epoch": 0.7049418604651163,
|
|
"grad_norm": 0.6253158306971405,
|
|
"learning_rate": 3.999997898246174e-05,
|
|
"loss": 0.3114,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1806681752204895,
|
|
"step": 485,
|
|
"valid_targets_mean": 4048.6,
|
|
"valid_targets_min": 659
|
|
},
|
|
{
|
|
"epoch": 0.7122093023255814,
|
|
"grad_norm": 0.6250751502415329,
|
|
"learning_rate": 3.999974253566362e-05,
|
|
"loss": 0.3187,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16524715721607208,
|
|
"step": 490,
|
|
"valid_targets_mean": 3338.9,
|
|
"valid_targets_min": 594
|
|
},
|
|
{
|
|
"epoch": 0.7194767441860465,
|
|
"grad_norm": 0.6124032350122675,
|
|
"learning_rate": 3.999924337326085e-05,
|
|
"loss": 0.3126,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13034440577030182,
|
|
"step": 495,
|
|
"valid_targets_mean": 2214.9,
|
|
"valid_targets_min": 578
|
|
},
|
|
{
|
|
"epoch": 0.7267441860465116,
|
|
"grad_norm": 0.9029943456959502,
|
|
"learning_rate": 3.9998481501810414e-05,
|
|
"loss": 0.3149,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1411435753107071,
|
|
"step": 500,
|
|
"valid_targets_mean": 3521.5,
|
|
"valid_targets_min": 634
|
|
},
|
|
{
|
|
"epoch": 0.7340116279069767,
|
|
"grad_norm": 0.6114689481192495,
|
|
"learning_rate": 3.999745693132021e-05,
|
|
"loss": 0.2994,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11579418182373047,
|
|
"step": 505,
|
|
"valid_targets_mean": 3004.8,
|
|
"valid_targets_min": 560
|
|
},
|
|
{
|
|
"epoch": 0.7412790697674418,
|
|
"grad_norm": 0.561556329434712,
|
|
"learning_rate": 3.999616967524894e-05,
|
|
"loss": 0.318,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16953226923942566,
|
|
"step": 510,
|
|
"valid_targets_mean": 4547.9,
|
|
"valid_targets_min": 971
|
|
},
|
|
{
|
|
"epoch": 0.748546511627907,
|
|
"grad_norm": 0.6387062020360811,
|
|
"learning_rate": 3.999461975050595e-05,
|
|
"loss": 0.3382,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.2010563313961029,
|
|
"step": 515,
|
|
"valid_targets_mean": 4711.6,
|
|
"valid_targets_min": 800
|
|
},
|
|
{
|
|
"epoch": 0.7558139534883721,
|
|
"grad_norm": 0.6150223941673152,
|
|
"learning_rate": 3.9992807177450956e-05,
|
|
"loss": 0.3091,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1380336582660675,
|
|
"step": 520,
|
|
"valid_targets_mean": 2641.8,
|
|
"valid_targets_min": 535
|
|
},
|
|
{
|
|
"epoch": 0.7630813953488372,
|
|
"grad_norm": 0.6623311527635831,
|
|
"learning_rate": 3.9990731979893834e-05,
|
|
"loss": 0.323,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17421071231365204,
|
|
"step": 525,
|
|
"valid_targets_mean": 3310.9,
|
|
"valid_targets_min": 815
|
|
},
|
|
{
|
|
"epoch": 0.7703488372093024,
|
|
"grad_norm": 0.644574318586418,
|
|
"learning_rate": 3.998839418509428e-05,
|
|
"loss": 0.3152,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1878730207681656,
|
|
"step": 530,
|
|
"valid_targets_mean": 4664.6,
|
|
"valid_targets_min": 697
|
|
},
|
|
{
|
|
"epoch": 0.7776162790697675,
|
|
"grad_norm": 0.5151536823530193,
|
|
"learning_rate": 3.998579382376143e-05,
|
|
"loss": 0.3181,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17093926668167114,
|
|
"step": 535,
|
|
"valid_targets_mean": 4806.2,
|
|
"valid_targets_min": 3993
|
|
},
|
|
{
|
|
"epoch": 0.7848837209302325,
|
|
"grad_norm": 0.5848122250774543,
|
|
"learning_rate": 3.9982930930053515e-05,
|
|
"loss": 0.3197,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19000868499279022,
|
|
"step": 540,
|
|
"valid_targets_mean": 4433.6,
|
|
"valid_targets_min": 772
|
|
},
|
|
{
|
|
"epoch": 0.7921511627906976,
|
|
"grad_norm": 0.6907826286413288,
|
|
"learning_rate": 3.9979805541577356e-05,
|
|
"loss": 0.3189,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12706348299980164,
|
|
"step": 545,
|
|
"valid_targets_mean": 2434.2,
|
|
"valid_targets_min": 647
|
|
},
|
|
{
|
|
"epoch": 0.7994186046511628,
|
|
"grad_norm": 0.5759344182112125,
|
|
"learning_rate": 3.99764176993879e-05,
|
|
"loss": 0.3178,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13058075308799744,
|
|
"step": 550,
|
|
"valid_targets_mean": 3536.2,
|
|
"valid_targets_min": 803
|
|
},
|
|
{
|
|
"epoch": 0.8066860465116279,
|
|
"grad_norm": 0.5679171468274491,
|
|
"learning_rate": 3.997276744798766e-05,
|
|
"loss": 0.3121,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18033181130886078,
|
|
"step": 555,
|
|
"valid_targets_mean": 4196.0,
|
|
"valid_targets_min": 907
|
|
},
|
|
{
|
|
"epoch": 0.813953488372093,
|
|
"grad_norm": 0.5257948098452856,
|
|
"learning_rate": 3.996885483532617e-05,
|
|
"loss": 0.3126,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16494852304458618,
|
|
"step": 560,
|
|
"valid_targets_mean": 4555.4,
|
|
"valid_targets_min": 707
|
|
},
|
|
{
|
|
"epoch": 0.8212209302325582,
|
|
"grad_norm": 0.6873649278599748,
|
|
"learning_rate": 3.9964679912799306e-05,
|
|
"loss": 0.3127,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1650257706642151,
|
|
"step": 565,
|
|
"valid_targets_mean": 3825.8,
|
|
"valid_targets_min": 632
|
|
},
|
|
{
|
|
"epoch": 0.8284883720930233,
|
|
"grad_norm": 0.5750252747412078,
|
|
"learning_rate": 3.9960242735248626e-05,
|
|
"loss": 0.3341,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1479925811290741,
|
|
"step": 570,
|
|
"valid_targets_mean": 3665.1,
|
|
"valid_targets_min": 946
|
|
},
|
|
{
|
|
"epoch": 0.8357558139534884,
|
|
"grad_norm": 0.600940591918952,
|
|
"learning_rate": 3.995554336096069e-05,
|
|
"loss": 0.3386,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12769609689712524,
|
|
"step": 575,
|
|
"valid_targets_mean": 4007.4,
|
|
"valid_targets_min": 433
|
|
},
|
|
{
|
|
"epoch": 0.8430232558139535,
|
|
"grad_norm": 0.5800527572863078,
|
|
"learning_rate": 3.995058185166623e-05,
|
|
"loss": 0.3014,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13579922914505005,
|
|
"step": 580,
|
|
"valid_targets_mean": 3511.2,
|
|
"valid_targets_min": 510
|
|
},
|
|
{
|
|
"epoch": 0.8502906976744186,
|
|
"grad_norm": 0.5904946794486696,
|
|
"learning_rate": 3.9945358272539373e-05,
|
|
"loss": 0.3036,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13859254121780396,
|
|
"step": 585,
|
|
"valid_targets_mean": 3177.5,
|
|
"valid_targets_min": 514
|
|
},
|
|
{
|
|
"epoch": 0.8575581395348837,
|
|
"grad_norm": 0.6700979896386047,
|
|
"learning_rate": 3.9939872692196805e-05,
|
|
"loss": 0.3081,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18660062551498413,
|
|
"step": 590,
|
|
"valid_targets_mean": 2899.0,
|
|
"valid_targets_min": 559
|
|
},
|
|
{
|
|
"epoch": 0.8648255813953488,
|
|
"grad_norm": 0.5746632492683453,
|
|
"learning_rate": 3.993412518269682e-05,
|
|
"loss": 0.3211,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1774902641773224,
|
|
"step": 595,
|
|
"valid_targets_mean": 4287.2,
|
|
"valid_targets_min": 743
|
|
},
|
|
{
|
|
"epoch": 0.872093023255814,
|
|
"grad_norm": 0.5380377747396158,
|
|
"learning_rate": 3.9928115819538416e-05,
|
|
"loss": 0.3141,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1711953580379486,
|
|
"step": 600,
|
|
"valid_targets_mean": 4814.6,
|
|
"valid_targets_min": 4037
|
|
},
|
|
{
|
|
"epoch": 0.8793604651162791,
|
|
"grad_norm": 0.6207951561335642,
|
|
"learning_rate": 3.992184468166028e-05,
|
|
"loss": 0.3158,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1701497882604599,
|
|
"step": 605,
|
|
"valid_targets_mean": 3301.4,
|
|
"valid_targets_min": 655
|
|
},
|
|
{
|
|
"epoch": 0.8866279069767442,
|
|
"grad_norm": 0.6066474074945402,
|
|
"learning_rate": 3.991531185143977e-05,
|
|
"loss": 0.2911,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14605024456977844,
|
|
"step": 610,
|
|
"valid_targets_mean": 3370.5,
|
|
"valid_targets_min": 611
|
|
},
|
|
{
|
|
"epoch": 0.8938953488372093,
|
|
"grad_norm": 0.528974517437865,
|
|
"learning_rate": 3.9908517414691806e-05,
|
|
"loss": 0.3,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14421282708644867,
|
|
"step": 615,
|
|
"valid_targets_mean": 3871.6,
|
|
"valid_targets_min": 1000
|
|
},
|
|
{
|
|
"epoch": 0.9011627906976745,
|
|
"grad_norm": 0.5593482014821316,
|
|
"learning_rate": 3.990146146066776e-05,
|
|
"loss": 0.3123,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15519869327545166,
|
|
"step": 620,
|
|
"valid_targets_mean": 4097.6,
|
|
"valid_targets_min": 878
|
|
},
|
|
{
|
|
"epoch": 0.9084302325581395,
|
|
"grad_norm": 0.6465303654402883,
|
|
"learning_rate": 3.98941440820543e-05,
|
|
"loss": 0.3146,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1523018181324005,
|
|
"step": 625,
|
|
"valid_targets_mean": 2658.4,
|
|
"valid_targets_min": 534
|
|
},
|
|
{
|
|
"epoch": 0.9156976744186046,
|
|
"grad_norm": 0.6464191733061095,
|
|
"learning_rate": 3.988656537497213e-05,
|
|
"loss": 0.3188,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15685781836509705,
|
|
"step": 630,
|
|
"valid_targets_mean": 2272.4,
|
|
"valid_targets_min": 707
|
|
},
|
|
{
|
|
"epoch": 0.9229651162790697,
|
|
"grad_norm": 0.6363180627039392,
|
|
"learning_rate": 3.987872543897477e-05,
|
|
"loss": 0.3121,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16334350407123566,
|
|
"step": 635,
|
|
"valid_targets_mean": 3598.2,
|
|
"valid_targets_min": 808
|
|
},
|
|
{
|
|
"epoch": 0.9302325581395349,
|
|
"grad_norm": 0.6442381315821747,
|
|
"learning_rate": 3.9870624377047206e-05,
|
|
"loss": 0.3225,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17397740483283997,
|
|
"step": 640,
|
|
"valid_targets_mean": 3169.8,
|
|
"valid_targets_min": 668
|
|
},
|
|
{
|
|
"epoch": 0.9375,
|
|
"grad_norm": 0.5925230417676065,
|
|
"learning_rate": 3.9862262295604594e-05,
|
|
"loss": 0.3029,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1986408531665802,
|
|
"step": 645,
|
|
"valid_targets_mean": 4408.5,
|
|
"valid_targets_min": 636
|
|
},
|
|
{
|
|
"epoch": 0.9447674418604651,
|
|
"grad_norm": 0.5912132183519685,
|
|
"learning_rate": 3.9853639304490815e-05,
|
|
"loss": 0.2946,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19908586144447327,
|
|
"step": 650,
|
|
"valid_targets_mean": 4032.0,
|
|
"valid_targets_min": 788
|
|
},
|
|
{
|
|
"epoch": 0.9520348837209303,
|
|
"grad_norm": 0.5233197409282695,
|
|
"learning_rate": 3.984475551697703e-05,
|
|
"loss": 0.3185,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1765996813774109,
|
|
"step": 655,
|
|
"valid_targets_mean": 3893.4,
|
|
"valid_targets_min": 811
|
|
},
|
|
{
|
|
"epoch": 0.9593023255813954,
|
|
"grad_norm": 0.5996865078000508,
|
|
"learning_rate": 3.9835611049760216e-05,
|
|
"loss": 0.3232,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19216126203536987,
|
|
"step": 660,
|
|
"valid_targets_mean": 3420.6,
|
|
"valid_targets_min": 471
|
|
},
|
|
{
|
|
"epoch": 0.9665697674418605,
|
|
"grad_norm": 0.5167680016756202,
|
|
"learning_rate": 3.982620602296166e-05,
|
|
"loss": 0.3122,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13381856679916382,
|
|
"step": 665,
|
|
"valid_targets_mean": 3309.5,
|
|
"valid_targets_min": 748
|
|
},
|
|
{
|
|
"epoch": 0.9738372093023255,
|
|
"grad_norm": 0.5746446225121188,
|
|
"learning_rate": 3.981654056012529e-05,
|
|
"loss": 0.3094,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11602400243282318,
|
|
"step": 670,
|
|
"valid_targets_mean": 2765.1,
|
|
"valid_targets_min": 549
|
|
},
|
|
{
|
|
"epoch": 0.9811046511627907,
|
|
"grad_norm": 0.6434502337970205,
|
|
"learning_rate": 3.980661478821614e-05,
|
|
"loss": 0.3454,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1325831413269043,
|
|
"step": 675,
|
|
"valid_targets_mean": 2170.1,
|
|
"valid_targets_min": 500
|
|
},
|
|
{
|
|
"epoch": 0.9883720930232558,
|
|
"grad_norm": 0.6068667229565959,
|
|
"learning_rate": 3.979642883761866e-05,
|
|
"loss": 0.2994,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.21635717153549194,
|
|
"step": 680,
|
|
"valid_targets_mean": 4260.9,
|
|
"valid_targets_min": 732
|
|
},
|
|
{
|
|
"epoch": 0.9956395348837209,
|
|
"grad_norm": 0.4944733997393646,
|
|
"learning_rate": 3.978598284213497e-05,
|
|
"loss": 0.2988,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15469247102737427,
|
|
"step": 685,
|
|
"valid_targets_mean": 4212.6,
|
|
"valid_targets_min": 646
|
|
},
|
|
{
|
|
"epoch": 1.002906976744186,
|
|
"grad_norm": 0.5954258533422989,
|
|
"learning_rate": 3.9775276938983144e-05,
|
|
"loss": 0.3086,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1707223355770111,
|
|
"step": 690,
|
|
"valid_targets_mean": 3524.9,
|
|
"valid_targets_min": 889
|
|
},
|
|
{
|
|
"epoch": 1.010174418604651,
|
|
"grad_norm": 0.5020818956819496,
|
|
"learning_rate": 3.9764311268795374e-05,
|
|
"loss": 0.2837,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13558289408683777,
|
|
"step": 695,
|
|
"valid_targets_mean": 4481.9,
|
|
"valid_targets_min": 612
|
|
},
|
|
{
|
|
"epoch": 1.0174418604651163,
|
|
"grad_norm": 0.5115399057944376,
|
|
"learning_rate": 3.9753085975616157e-05,
|
|
"loss": 0.3015,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15828119218349457,
|
|
"step": 700,
|
|
"valid_targets_mean": 4807.2,
|
|
"valid_targets_min": 621
|
|
},
|
|
{
|
|
"epoch": 1.0247093023255813,
|
|
"grad_norm": 0.6295735522719244,
|
|
"learning_rate": 3.9741601206900376e-05,
|
|
"loss": 0.294,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12198431044816971,
|
|
"step": 705,
|
|
"valid_targets_mean": 2282.0,
|
|
"valid_targets_min": 628
|
|
},
|
|
{
|
|
"epoch": 1.0319767441860466,
|
|
"grad_norm": 0.6530251313106338,
|
|
"learning_rate": 3.972985711351136e-05,
|
|
"loss": 0.3069,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1703912913799286,
|
|
"step": 710,
|
|
"valid_targets_mean": 2788.5,
|
|
"valid_targets_min": 508
|
|
},
|
|
{
|
|
"epoch": 1.0392441860465116,
|
|
"grad_norm": 0.7380539475948441,
|
|
"learning_rate": 3.971785384971894e-05,
|
|
"loss": 0.2876,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18880873918533325,
|
|
"step": 715,
|
|
"valid_targets_mean": 5222.1,
|
|
"valid_targets_min": 550
|
|
},
|
|
{
|
|
"epoch": 1.0465116279069768,
|
|
"grad_norm": 0.5226027075387328,
|
|
"learning_rate": 3.970559157319737e-05,
|
|
"loss": 0.2858,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17227350175380707,
|
|
"step": 720,
|
|
"valid_targets_mean": 4441.9,
|
|
"valid_targets_min": 662
|
|
},
|
|
{
|
|
"epoch": 1.0537790697674418,
|
|
"grad_norm": 0.5203168649565341,
|
|
"learning_rate": 3.9693070445023297e-05,
|
|
"loss": 0.3006,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14260490238666534,
|
|
"step": 725,
|
|
"valid_targets_mean": 4482.8,
|
|
"valid_targets_min": 546
|
|
},
|
|
{
|
|
"epoch": 1.0610465116279069,
|
|
"grad_norm": 0.6553194107917635,
|
|
"learning_rate": 3.968029062967363e-05,
|
|
"loss": 0.3136,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15954704582691193,
|
|
"step": 730,
|
|
"valid_targets_mean": 2214.1,
|
|
"valid_targets_min": 615
|
|
},
|
|
{
|
|
"epoch": 1.068313953488372,
|
|
"grad_norm": 0.5924767029335875,
|
|
"learning_rate": 3.966725229502336e-05,
|
|
"loss": 0.2906,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13051603734493256,
|
|
"step": 735,
|
|
"valid_targets_mean": 2960.1,
|
|
"valid_targets_min": 852
|
|
},
|
|
{
|
|
"epoch": 1.0755813953488371,
|
|
"grad_norm": 0.6145150473623321,
|
|
"learning_rate": 3.965395561234341e-05,
|
|
"loss": 0.2918,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14821113646030426,
|
|
"step": 740,
|
|
"valid_targets_mean": 3790.0,
|
|
"valid_targets_min": 594
|
|
},
|
|
{
|
|
"epoch": 1.0828488372093024,
|
|
"grad_norm": 0.6427556361525683,
|
|
"learning_rate": 3.9640400756298325e-05,
|
|
"loss": 0.2938,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11527499556541443,
|
|
"step": 745,
|
|
"valid_targets_mean": 2748.6,
|
|
"valid_targets_min": 592
|
|
},
|
|
{
|
|
"epoch": 1.0901162790697674,
|
|
"grad_norm": 0.5381745813762965,
|
|
"learning_rate": 3.9626587904943996e-05,
|
|
"loss": 0.2932,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15444537997245789,
|
|
"step": 750,
|
|
"valid_targets_mean": 3721.0,
|
|
"valid_targets_min": 617
|
|
},
|
|
{
|
|
"epoch": 1.0973837209302326,
|
|
"grad_norm": 0.6262758723974868,
|
|
"learning_rate": 3.961251723972535e-05,
|
|
"loss": 0.2966,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1222953200340271,
|
|
"step": 755,
|
|
"valid_targets_mean": 2428.2,
|
|
"valid_targets_min": 484
|
|
},
|
|
{
|
|
"epoch": 1.1046511627906976,
|
|
"grad_norm": 0.6024971681939152,
|
|
"learning_rate": 3.959818894547393e-05,
|
|
"loss": 0.288,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1502443253993988,
|
|
"step": 760,
|
|
"valid_targets_mean": 3520.6,
|
|
"valid_targets_min": 667
|
|
},
|
|
{
|
|
"epoch": 1.1119186046511629,
|
|
"grad_norm": 0.6024643305619749,
|
|
"learning_rate": 3.9583603210405484e-05,
|
|
"loss": 0.2866,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1113622784614563,
|
|
"step": 765,
|
|
"valid_targets_mean": 2564.2,
|
|
"valid_targets_min": 469
|
|
},
|
|
{
|
|
"epoch": 1.119186046511628,
|
|
"grad_norm": 0.6075985529163336,
|
|
"learning_rate": 3.956876022611748e-05,
|
|
"loss": 0.2917,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1365235447883606,
|
|
"step": 770,
|
|
"valid_targets_mean": 2986.5,
|
|
"valid_targets_min": 772
|
|
},
|
|
{
|
|
"epoch": 1.1264534883720931,
|
|
"grad_norm": 0.5847751575794944,
|
|
"learning_rate": 3.9553660187586625e-05,
|
|
"loss": 0.2948,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13294722139835358,
|
|
"step": 775,
|
|
"valid_targets_mean": 3096.1,
|
|
"valid_targets_min": 686
|
|
},
|
|
{
|
|
"epoch": 1.1337209302325582,
|
|
"grad_norm": 0.5594747695034635,
|
|
"learning_rate": 3.9538303293166243e-05,
|
|
"loss": 0.2819,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13940271735191345,
|
|
"step": 780,
|
|
"valid_targets_mean": 3422.9,
|
|
"valid_targets_min": 912
|
|
},
|
|
{
|
|
"epoch": 1.1409883720930232,
|
|
"grad_norm": 0.5444550515911036,
|
|
"learning_rate": 3.952268974458373e-05,
|
|
"loss": 0.3074,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13107138872146606,
|
|
"step": 785,
|
|
"valid_targets_mean": 4094.4,
|
|
"valid_targets_min": 586
|
|
},
|
|
{
|
|
"epoch": 1.1482558139534884,
|
|
"grad_norm": 0.8455637167751516,
|
|
"learning_rate": 3.950681974693787e-05,
|
|
"loss": 0.2931,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1299535632133484,
|
|
"step": 790,
|
|
"valid_targets_mean": 3531.8,
|
|
"valid_targets_min": 476
|
|
},
|
|
{
|
|
"epoch": 1.1555232558139534,
|
|
"grad_norm": 0.5600026310525352,
|
|
"learning_rate": 3.949069350869614e-05,
|
|
"loss": 0.3147,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1660255640745163,
|
|
"step": 795,
|
|
"valid_targets_mean": 3931.5,
|
|
"valid_targets_min": 513
|
|
},
|
|
{
|
|
"epoch": 1.1627906976744187,
|
|
"grad_norm": 0.5787989442009414,
|
|
"learning_rate": 3.9474311241691994e-05,
|
|
"loss": 0.3049,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11841486394405365,
|
|
"step": 800,
|
|
"valid_targets_mean": 2689.1,
|
|
"valid_targets_min": 377
|
|
},
|
|
{
|
|
"epoch": 1.1700581395348837,
|
|
"grad_norm": 0.5607944017063098,
|
|
"learning_rate": 3.945767316112206e-05,
|
|
"loss": 0.3073,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1844930201768875,
|
|
"step": 805,
|
|
"valid_targets_mean": 4312.1,
|
|
"valid_targets_min": 596
|
|
},
|
|
{
|
|
"epoch": 1.177325581395349,
|
|
"grad_norm": 0.5505080993653617,
|
|
"learning_rate": 3.944077948554333e-05,
|
|
"loss": 0.302,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14519767463207245,
|
|
"step": 810,
|
|
"valid_targets_mean": 3942.4,
|
|
"valid_targets_min": 666
|
|
},
|
|
{
|
|
"epoch": 1.184593023255814,
|
|
"grad_norm": 0.5661161246942287,
|
|
"learning_rate": 3.9423630436870255e-05,
|
|
"loss": 0.2843,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11194830387830734,
|
|
"step": 815,
|
|
"valid_targets_mean": 2164.8,
|
|
"valid_targets_min": 467
|
|
},
|
|
{
|
|
"epoch": 1.191860465116279,
|
|
"grad_norm": 0.5120139801918556,
|
|
"learning_rate": 3.940622624037188e-05,
|
|
"loss": 0.3015,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12605825066566467,
|
|
"step": 820,
|
|
"valid_targets_mean": 3943.4,
|
|
"valid_targets_min": 716
|
|
},
|
|
{
|
|
"epoch": 1.1991279069767442,
|
|
"grad_norm": 0.525392557133716,
|
|
"learning_rate": 3.938856712466885e-05,
|
|
"loss": 0.2788,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1255475878715515,
|
|
"step": 825,
|
|
"valid_targets_mean": 3209.6,
|
|
"valid_targets_min": 484
|
|
},
|
|
{
|
|
"epoch": 1.2063953488372092,
|
|
"grad_norm": 0.657741147392811,
|
|
"learning_rate": 3.93706533217304e-05,
|
|
"loss": 0.29,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15574149787425995,
|
|
"step": 830,
|
|
"valid_targets_mean": 2886.0,
|
|
"valid_targets_min": 750
|
|
},
|
|
{
|
|
"epoch": 1.2136627906976745,
|
|
"grad_norm": 0.5516109167421356,
|
|
"learning_rate": 3.935248506687136e-05,
|
|
"loss": 0.302,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18783080577850342,
|
|
"step": 835,
|
|
"valid_targets_mean": 4719.0,
|
|
"valid_targets_min": 731
|
|
},
|
|
{
|
|
"epoch": 1.2209302325581395,
|
|
"grad_norm": 0.49925446777716886,
|
|
"learning_rate": 3.9334062598748986e-05,
|
|
"loss": 0.2899,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11280782520771027,
|
|
"step": 840,
|
|
"valid_targets_mean": 3761.0,
|
|
"valid_targets_min": 624
|
|
},
|
|
{
|
|
"epoch": 1.2281976744186047,
|
|
"grad_norm": 0.5011178404184398,
|
|
"learning_rate": 3.931538615935989e-05,
|
|
"loss": 0.2746,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12659627199172974,
|
|
"step": 845,
|
|
"valid_targets_mean": 3629.0,
|
|
"valid_targets_min": 695
|
|
},
|
|
{
|
|
"epoch": 1.2354651162790697,
|
|
"grad_norm": 0.4930281326129707,
|
|
"learning_rate": 3.929645599403684e-05,
|
|
"loss": 0.2905,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11583171039819717,
|
|
"step": 850,
|
|
"valid_targets_mean": 3803.5,
|
|
"valid_targets_min": 518
|
|
},
|
|
{
|
|
"epoch": 1.2427325581395348,
|
|
"grad_norm": 0.5801439996466439,
|
|
"learning_rate": 3.9277272351445524e-05,
|
|
"loss": 0.2858,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13249947130680084,
|
|
"step": 855,
|
|
"valid_targets_mean": 2848.5,
|
|
"valid_targets_min": 795
|
|
},
|
|
{
|
|
"epoch": 1.25,
|
|
"grad_norm": 0.5622353243784237,
|
|
"learning_rate": 3.9257835483581306e-05,
|
|
"loss": 0.2965,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13136523962020874,
|
|
"step": 860,
|
|
"valid_targets_mean": 3588.1,
|
|
"valid_targets_min": 868
|
|
},
|
|
{
|
|
"epoch": 1.2572674418604652,
|
|
"grad_norm": 0.6131025997715869,
|
|
"learning_rate": 3.923814564576589e-05,
|
|
"loss": 0.287,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15739820897579193,
|
|
"step": 865,
|
|
"valid_targets_mean": 3525.5,
|
|
"valid_targets_min": 700
|
|
},
|
|
{
|
|
"epoch": 1.2645348837209303,
|
|
"grad_norm": 0.5310602027404243,
|
|
"learning_rate": 3.921820309664398e-05,
|
|
"loss": 0.2969,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1796557605266571,
|
|
"step": 870,
|
|
"valid_targets_mean": 4290.6,
|
|
"valid_targets_min": 1106
|
|
},
|
|
{
|
|
"epoch": 1.2718023255813953,
|
|
"grad_norm": 0.5665637728934327,
|
|
"learning_rate": 3.91980080981799e-05,
|
|
"loss": 0.2987,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15872395038604736,
|
|
"step": 875,
|
|
"valid_targets_mean": 3355.1,
|
|
"valid_targets_min": 479
|
|
},
|
|
{
|
|
"epoch": 1.2790697674418605,
|
|
"grad_norm": 0.5123883343895528,
|
|
"learning_rate": 3.917756091565414e-05,
|
|
"loss": 0.2951,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12424245476722717,
|
|
"step": 880,
|
|
"valid_targets_mean": 3292.4,
|
|
"valid_targets_min": 591
|
|
},
|
|
{
|
|
"epoch": 1.2863372093023255,
|
|
"grad_norm": 0.5418967521351696,
|
|
"learning_rate": 3.915686181765983e-05,
|
|
"loss": 0.2985,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12708592414855957,
|
|
"step": 885,
|
|
"valid_targets_mean": 2999.8,
|
|
"valid_targets_min": 655
|
|
},
|
|
{
|
|
"epoch": 1.2936046511627908,
|
|
"grad_norm": 0.5430718445751821,
|
|
"learning_rate": 3.9135911076099286e-05,
|
|
"loss": 0.2912,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1379009634256363,
|
|
"step": 890,
|
|
"valid_targets_mean": 3595.6,
|
|
"valid_targets_min": 556
|
|
},
|
|
{
|
|
"epoch": 1.3008720930232558,
|
|
"grad_norm": 0.526588721715433,
|
|
"learning_rate": 3.9114708966180385e-05,
|
|
"loss": 0.2869,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15102040767669678,
|
|
"step": 895,
|
|
"valid_targets_mean": 4072.5,
|
|
"valid_targets_min": 891
|
|
},
|
|
{
|
|
"epoch": 1.308139534883721,
|
|
"grad_norm": 0.5047952119967307,
|
|
"learning_rate": 3.909325576641298e-05,
|
|
"loss": 0.293,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1750989854335785,
|
|
"step": 900,
|
|
"valid_targets_mean": 5263.9,
|
|
"valid_targets_min": 3460
|
|
},
|
|
{
|
|
"epoch": 1.315406976744186,
|
|
"grad_norm": 0.496714389262161,
|
|
"learning_rate": 3.907155175860519e-05,
|
|
"loss": 0.2764,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12206344306468964,
|
|
"step": 905,
|
|
"valid_targets_mean": 3841.0,
|
|
"valid_targets_min": 840
|
|
},
|
|
{
|
|
"epoch": 1.322674418604651,
|
|
"grad_norm": 0.548533268898909,
|
|
"learning_rate": 3.904959722785978e-05,
|
|
"loss": 0.2991,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1320100873708725,
|
|
"step": 910,
|
|
"valid_targets_mean": 3564.2,
|
|
"valid_targets_min": 428
|
|
},
|
|
{
|
|
"epoch": 1.3299418604651163,
|
|
"grad_norm": 0.5709238019153562,
|
|
"learning_rate": 3.902739246257035e-05,
|
|
"loss": 0.3012,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16724197566509247,
|
|
"step": 915,
|
|
"valid_targets_mean": 3494.5,
|
|
"valid_targets_min": 771
|
|
},
|
|
{
|
|
"epoch": 1.3372093023255813,
|
|
"grad_norm": 0.6026091154187614,
|
|
"learning_rate": 3.9004937754417576e-05,
|
|
"loss": 0.2879,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1599448174238205,
|
|
"step": 920,
|
|
"valid_targets_mean": 3057.8,
|
|
"valid_targets_min": 590
|
|
},
|
|
{
|
|
"epoch": 1.3444767441860466,
|
|
"grad_norm": 0.5583822762143399,
|
|
"learning_rate": 3.898223339836535e-05,
|
|
"loss": 0.2905,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13246658444404602,
|
|
"step": 925,
|
|
"valid_targets_mean": 2905.2,
|
|
"valid_targets_min": 332
|
|
},
|
|
{
|
|
"epoch": 1.3517441860465116,
|
|
"grad_norm": 0.4972947567573365,
|
|
"learning_rate": 3.8959279692656965e-05,
|
|
"loss": 0.2739,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11695317924022675,
|
|
"step": 930,
|
|
"valid_targets_mean": 3299.1,
|
|
"valid_targets_min": 763
|
|
},
|
|
{
|
|
"epoch": 1.3590116279069768,
|
|
"grad_norm": 0.6349529472272955,
|
|
"learning_rate": 3.893607693881113e-05,
|
|
"loss": 0.2888,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13736936450004578,
|
|
"step": 935,
|
|
"valid_targets_mean": 2173.0,
|
|
"valid_targets_min": 570
|
|
},
|
|
{
|
|
"epoch": 1.3662790697674418,
|
|
"grad_norm": 0.5235242978606963,
|
|
"learning_rate": 3.8912625441618034e-05,
|
|
"loss": 0.3246,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.22577857971191406,
|
|
"step": 940,
|
|
"valid_targets_mean": 5353.6,
|
|
"valid_targets_min": 779
|
|
},
|
|
{
|
|
"epoch": 1.3735465116279069,
|
|
"grad_norm": 0.507118960736435,
|
|
"learning_rate": 3.8888925509135365e-05,
|
|
"loss": 0.2873,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15891097486019135,
|
|
"step": 945,
|
|
"valid_targets_mean": 4224.1,
|
|
"valid_targets_min": 565
|
|
},
|
|
{
|
|
"epoch": 1.380813953488372,
|
|
"grad_norm": 0.5727509164803489,
|
|
"learning_rate": 3.8864977452684235e-05,
|
|
"loss": 0.2943,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11320075392723083,
|
|
"step": 950,
|
|
"valid_targets_mean": 3410.9,
|
|
"valid_targets_min": 671
|
|
},
|
|
{
|
|
"epoch": 1.3880813953488373,
|
|
"grad_norm": 0.6089894761450095,
|
|
"learning_rate": 3.88407815868451e-05,
|
|
"loss": 0.2838,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12657169997692108,
|
|
"step": 955,
|
|
"valid_targets_mean": 2158.1,
|
|
"valid_targets_min": 587
|
|
},
|
|
{
|
|
"epoch": 1.3953488372093024,
|
|
"grad_norm": 0.5874352781433988,
|
|
"learning_rate": 3.8816338229453616e-05,
|
|
"loss": 0.2948,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15347419679164886,
|
|
"step": 960,
|
|
"valid_targets_mean": 3367.5,
|
|
"valid_targets_min": 666
|
|
},
|
|
{
|
|
"epoch": 1.4026162790697674,
|
|
"grad_norm": 0.6166326785595897,
|
|
"learning_rate": 3.879164770159651e-05,
|
|
"loss": 0.2839,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14318858087062836,
|
|
"step": 965,
|
|
"valid_targets_mean": 3344.9,
|
|
"valid_targets_min": 608
|
|
},
|
|
{
|
|
"epoch": 1.4098837209302326,
|
|
"grad_norm": 0.557062845918987,
|
|
"learning_rate": 3.8766710327607275e-05,
|
|
"loss": 0.291,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1791156828403473,
|
|
"step": 970,
|
|
"valid_targets_mean": 4556.5,
|
|
"valid_targets_min": 563
|
|
},
|
|
{
|
|
"epoch": 1.4171511627906976,
|
|
"grad_norm": 0.5911823376876226,
|
|
"learning_rate": 3.874152643506202e-05,
|
|
"loss": 0.2785,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14642855525016785,
|
|
"step": 975,
|
|
"valid_targets_mean": 2476.5,
|
|
"valid_targets_min": 562
|
|
},
|
|
{
|
|
"epoch": 1.4244186046511627,
|
|
"grad_norm": 0.6477050154264477,
|
|
"learning_rate": 3.871609635477507e-05,
|
|
"loss": 0.3037,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17030063271522522,
|
|
"step": 980,
|
|
"valid_targets_mean": 3118.4,
|
|
"valid_targets_min": 690
|
|
},
|
|
{
|
|
"epoch": 1.431686046511628,
|
|
"grad_norm": 0.5264548444989446,
|
|
"learning_rate": 3.869042042079467e-05,
|
|
"loss": 0.2765,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12108216434717178,
|
|
"step": 985,
|
|
"valid_targets_mean": 3474.5,
|
|
"valid_targets_min": 569
|
|
},
|
|
{
|
|
"epoch": 1.4389534883720931,
|
|
"grad_norm": 0.5521838915160564,
|
|
"learning_rate": 3.866449897039859e-05,
|
|
"loss": 0.3149,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1818712055683136,
|
|
"step": 990,
|
|
"valid_targets_mean": 4667.5,
|
|
"valid_targets_min": 496
|
|
},
|
|
{
|
|
"epoch": 1.4462209302325582,
|
|
"grad_norm": 0.5572670157606036,
|
|
"learning_rate": 3.863833234408969e-05,
|
|
"loss": 0.2817,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0819392278790474,
|
|
"step": 995,
|
|
"valid_targets_mean": 1904.2,
|
|
"valid_targets_min": 507
|
|
},
|
|
{
|
|
"epoch": 1.4534883720930232,
|
|
"grad_norm": 0.5393974949240506,
|
|
"learning_rate": 3.861192088559144e-05,
|
|
"loss": 0.2881,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14820337295532227,
|
|
"step": 1000,
|
|
"valid_targets_mean": 3899.6,
|
|
"valid_targets_min": 696
|
|
},
|
|
{
|
|
"epoch": 1.4607558139534884,
|
|
"grad_norm": 0.5683915302410261,
|
|
"learning_rate": 3.858526494184344e-05,
|
|
"loss": 0.3142,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12288520485162735,
|
|
"step": 1005,
|
|
"valid_targets_mean": 2486.5,
|
|
"valid_targets_min": 483
|
|
},
|
|
{
|
|
"epoch": 1.4680232558139534,
|
|
"grad_norm": 0.5783311941630546,
|
|
"learning_rate": 3.8558364862996796e-05,
|
|
"loss": 0.2925,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13479480147361755,
|
|
"step": 1010,
|
|
"valid_targets_mean": 2884.5,
|
|
"valid_targets_min": 723
|
|
},
|
|
{
|
|
"epoch": 1.4752906976744187,
|
|
"grad_norm": 0.6207113680745554,
|
|
"learning_rate": 3.853122100240959e-05,
|
|
"loss": 0.3007,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16201730072498322,
|
|
"step": 1015,
|
|
"valid_targets_mean": 3314.5,
|
|
"valid_targets_min": 627
|
|
},
|
|
{
|
|
"epoch": 1.4825581395348837,
|
|
"grad_norm": 0.5494676329745364,
|
|
"learning_rate": 3.850383371664219e-05,
|
|
"loss": 0.2846,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14080458879470825,
|
|
"step": 1020,
|
|
"valid_targets_mean": 3708.6,
|
|
"valid_targets_min": 679
|
|
},
|
|
{
|
|
"epoch": 1.489825581395349,
|
|
"grad_norm": 0.5543402259634419,
|
|
"learning_rate": 3.8476203365452607e-05,
|
|
"loss": 0.2943,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14013566076755524,
|
|
"step": 1025,
|
|
"valid_targets_mean": 2788.2,
|
|
"valid_targets_min": 662
|
|
},
|
|
{
|
|
"epoch": 1.497093023255814,
|
|
"grad_norm": 0.5148659577451574,
|
|
"learning_rate": 3.8448330311791735e-05,
|
|
"loss": 0.2835,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16535460948944092,
|
|
"step": 1030,
|
|
"valid_targets_mean": 5268.8,
|
|
"valid_targets_min": 3758
|
|
},
|
|
{
|
|
"epoch": 1.504360465116279,
|
|
"grad_norm": 0.5245117965273571,
|
|
"learning_rate": 3.842021492179858e-05,
|
|
"loss": 0.2776,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10683688521385193,
|
|
"step": 1035,
|
|
"valid_targets_mean": 2680.6,
|
|
"valid_targets_min": 736
|
|
},
|
|
{
|
|
"epoch": 1.5116279069767442,
|
|
"grad_norm": 0.4994303593565894,
|
|
"learning_rate": 3.8391857564795494e-05,
|
|
"loss": 0.2699,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13968025147914886,
|
|
"step": 1040,
|
|
"valid_targets_mean": 4212.2,
|
|
"valid_targets_min": 534
|
|
},
|
|
{
|
|
"epoch": 1.5188953488372094,
|
|
"grad_norm": 0.598042521831162,
|
|
"learning_rate": 3.836325861328328e-05,
|
|
"loss": 0.2993,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1949174851179123,
|
|
"step": 1045,
|
|
"valid_targets_mean": 3461.8,
|
|
"valid_targets_min": 623
|
|
},
|
|
{
|
|
"epoch": 1.5261627906976745,
|
|
"grad_norm": 0.5229294300773233,
|
|
"learning_rate": 3.83344184429363e-05,
|
|
"loss": 0.288,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14252832531929016,
|
|
"step": 1050,
|
|
"valid_targets_mean": 3490.0,
|
|
"valid_targets_min": 159
|
|
},
|
|
{
|
|
"epoch": 1.5334302325581395,
|
|
"grad_norm": 0.4725224756008864,
|
|
"learning_rate": 3.83053374325976e-05,
|
|
"loss": 0.2854,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15991975367069244,
|
|
"step": 1055,
|
|
"valid_targets_mean": 5041.9,
|
|
"valid_targets_min": 1040
|
|
},
|
|
{
|
|
"epoch": 1.5406976744186047,
|
|
"grad_norm": 0.4953697177639167,
|
|
"learning_rate": 3.827601596427383e-05,
|
|
"loss": 0.2798,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15688475966453552,
|
|
"step": 1060,
|
|
"valid_targets_mean": 4240.1,
|
|
"valid_targets_min": 881
|
|
},
|
|
{
|
|
"epoch": 1.5479651162790697,
|
|
"grad_norm": 0.5420901673992,
|
|
"learning_rate": 3.824645442313033e-05,
|
|
"loss": 0.2896,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1448085904121399,
|
|
"step": 1065,
|
|
"valid_targets_mean": 3815.6,
|
|
"valid_targets_min": 699
|
|
},
|
|
{
|
|
"epoch": 1.5552325581395348,
|
|
"grad_norm": 0.5260497967025354,
|
|
"learning_rate": 3.8216653197486004e-05,
|
|
"loss": 0.2821,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13990908861160278,
|
|
"step": 1070,
|
|
"valid_targets_mean": 4333.5,
|
|
"valid_targets_min": 620
|
|
},
|
|
{
|
|
"epoch": 1.5625,
|
|
"grad_norm": 0.49690016233693,
|
|
"learning_rate": 3.818661267880823e-05,
|
|
"loss": 0.3081,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1375221610069275,
|
|
"step": 1075,
|
|
"valid_targets_mean": 4047.8,
|
|
"valid_targets_min": 847
|
|
},
|
|
{
|
|
"epoch": 1.5697674418604652,
|
|
"grad_norm": 0.5168520175806998,
|
|
"learning_rate": 3.815633326170776e-05,
|
|
"loss": 0.2622,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10871457308530807,
|
|
"step": 1080,
|
|
"valid_targets_mean": 3121.6,
|
|
"valid_targets_min": 679
|
|
},
|
|
{
|
|
"epoch": 1.5770348837209303,
|
|
"grad_norm": 0.5329589909031591,
|
|
"learning_rate": 3.812581534393347e-05,
|
|
"loss": 0.2884,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1447029411792755,
|
|
"step": 1085,
|
|
"valid_targets_mean": 3910.0,
|
|
"valid_targets_min": 716
|
|
},
|
|
{
|
|
"epoch": 1.5843023255813953,
|
|
"grad_norm": 0.5281908929906156,
|
|
"learning_rate": 3.809505932636717e-05,
|
|
"loss": 0.2781,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16305357217788696,
|
|
"step": 1090,
|
|
"valid_targets_mean": 4355.1,
|
|
"valid_targets_min": 660
|
|
},
|
|
{
|
|
"epoch": 1.5915697674418605,
|
|
"grad_norm": 0.6180623277335446,
|
|
"learning_rate": 3.8064065613018376e-05,
|
|
"loss": 0.2836,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.151731476187706,
|
|
"step": 1095,
|
|
"valid_targets_mean": 3038.8,
|
|
"valid_targets_min": 527
|
|
},
|
|
{
|
|
"epoch": 1.5988372093023255,
|
|
"grad_norm": 0.5003352743399826,
|
|
"learning_rate": 3.803283461101892e-05,
|
|
"loss": 0.2766,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14992684125900269,
|
|
"step": 1100,
|
|
"valid_targets_mean": 4808.9,
|
|
"valid_targets_min": 727
|
|
},
|
|
{
|
|
"epoch": 1.6061046511627906,
|
|
"grad_norm": 0.5582492530325496,
|
|
"learning_rate": 3.800136673061765e-05,
|
|
"loss": 0.2986,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15017104148864746,
|
|
"step": 1105,
|
|
"valid_targets_mean": 3318.8,
|
|
"valid_targets_min": 599
|
|
},
|
|
{
|
|
"epoch": 1.6133720930232558,
|
|
"grad_norm": 0.48010674994635283,
|
|
"learning_rate": 3.796966238517508e-05,
|
|
"loss": 0.293,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09976556897163391,
|
|
"step": 1110,
|
|
"valid_targets_mean": 3718.4,
|
|
"valid_targets_min": 456
|
|
},
|
|
{
|
|
"epoch": 1.620639534883721,
|
|
"grad_norm": 0.47774041262137673,
|
|
"learning_rate": 3.793772199115786e-05,
|
|
"loss": 0.2996,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15033277869224548,
|
|
"step": 1115,
|
|
"valid_targets_mean": 4473.0,
|
|
"valid_targets_min": 635
|
|
},
|
|
{
|
|
"epoch": 1.627906976744186,
|
|
"grad_norm": 0.508476646299974,
|
|
"learning_rate": 3.790554596813339e-05,
|
|
"loss": 0.2827,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13769778609275818,
|
|
"step": 1120,
|
|
"valid_targets_mean": 3927.5,
|
|
"valid_targets_min": 615
|
|
},
|
|
{
|
|
"epoch": 1.635174418604651,
|
|
"grad_norm": 0.5352158793527734,
|
|
"learning_rate": 3.787313473876429e-05,
|
|
"loss": 0.2793,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13205015659332275,
|
|
"step": 1125,
|
|
"valid_targets_mean": 3941.2,
|
|
"valid_targets_min": 741
|
|
},
|
|
{
|
|
"epoch": 1.6424418604651163,
|
|
"grad_norm": 0.551833691323417,
|
|
"learning_rate": 3.784048872880282e-05,
|
|
"loss": 0.2726,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14076612889766693,
|
|
"step": 1130,
|
|
"valid_targets_mean": 3053.6,
|
|
"valid_targets_min": 545
|
|
},
|
|
{
|
|
"epoch": 1.6497093023255816,
|
|
"grad_norm": 0.48623918737753347,
|
|
"learning_rate": 3.780760836708531e-05,
|
|
"loss": 0.2761,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1337115466594696,
|
|
"step": 1135,
|
|
"valid_targets_mean": 4660.6,
|
|
"valid_targets_min": 3615
|
|
},
|
|
{
|
|
"epoch": 1.6569767441860463,
|
|
"grad_norm": 0.5265160121639417,
|
|
"learning_rate": 3.777449408552653e-05,
|
|
"loss": 0.2861,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15630273520946503,
|
|
"step": 1140,
|
|
"valid_targets_mean": 3580.8,
|
|
"valid_targets_min": 709
|
|
},
|
|
{
|
|
"epoch": 1.6642441860465116,
|
|
"grad_norm": 0.6484297812170937,
|
|
"learning_rate": 3.774114631911401e-05,
|
|
"loss": 0.2841,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14704245328903198,
|
|
"step": 1145,
|
|
"valid_targets_mean": 3001.8,
|
|
"valid_targets_min": 697
|
|
},
|
|
{
|
|
"epoch": 1.6715116279069768,
|
|
"grad_norm": 0.477713717581914,
|
|
"learning_rate": 3.770756550590231e-05,
|
|
"loss": 0.2746,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12983140349388123,
|
|
"step": 1150,
|
|
"valid_targets_mean": 4782.8,
|
|
"valid_targets_min": 2777
|
|
},
|
|
{
|
|
"epoch": 1.6787790697674418,
|
|
"grad_norm": 0.5302430878469313,
|
|
"learning_rate": 3.767375208700729e-05,
|
|
"loss": 0.2878,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15250588953495026,
|
|
"step": 1155,
|
|
"valid_targets_mean": 3942.6,
|
|
"valid_targets_min": 578
|
|
},
|
|
{
|
|
"epoch": 1.6860465116279069,
|
|
"grad_norm": 1.0261147639745576,
|
|
"learning_rate": 3.763970650660032e-05,
|
|
"loss": 0.2849,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15077000856399536,
|
|
"step": 1160,
|
|
"valid_targets_mean": 4066.6,
|
|
"valid_targets_min": 766
|
|
},
|
|
{
|
|
"epoch": 1.693313953488372,
|
|
"grad_norm": 0.5350975912828917,
|
|
"learning_rate": 3.76054292119024e-05,
|
|
"loss": 0.2782,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12772193551063538,
|
|
"step": 1165,
|
|
"valid_targets_mean": 3557.6,
|
|
"valid_targets_min": 850
|
|
},
|
|
{
|
|
"epoch": 1.7005813953488373,
|
|
"grad_norm": 0.5502847590101302,
|
|
"learning_rate": 3.7570920653178355e-05,
|
|
"loss": 0.3035,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1232425644993782,
|
|
"step": 1170,
|
|
"valid_targets_mean": 2857.4,
|
|
"valid_targets_min": 626
|
|
},
|
|
{
|
|
"epoch": 1.7078488372093024,
|
|
"grad_norm": 0.5051049922272837,
|
|
"learning_rate": 3.753618128373086e-05,
|
|
"loss": 0.2802,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1397297978401184,
|
|
"step": 1175,
|
|
"valid_targets_mean": 4253.1,
|
|
"valid_targets_min": 496
|
|
},
|
|
{
|
|
"epoch": 1.7151162790697674,
|
|
"grad_norm": 0.5075044635586806,
|
|
"learning_rate": 3.75012115598945e-05,
|
|
"loss": 0.2834,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1724143773317337,
|
|
"step": 1180,
|
|
"valid_targets_mean": 4327.4,
|
|
"valid_targets_min": 532
|
|
},
|
|
{
|
|
"epoch": 1.7223837209302326,
|
|
"grad_norm": 0.5879909794286214,
|
|
"learning_rate": 3.7466011941029806e-05,
|
|
"loss": 0.2967,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17726115882396698,
|
|
"step": 1185,
|
|
"valid_targets_mean": 2947.8,
|
|
"valid_targets_min": 612
|
|
},
|
|
{
|
|
"epoch": 1.7296511627906976,
|
|
"grad_norm": 0.4971577954565775,
|
|
"learning_rate": 3.743058288951719e-05,
|
|
"loss": 0.2827,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12558473646640778,
|
|
"step": 1190,
|
|
"valid_targets_mean": 3530.9,
|
|
"valid_targets_min": 782
|
|
},
|
|
{
|
|
"epoch": 1.7369186046511627,
|
|
"grad_norm": 0.5910499715345675,
|
|
"learning_rate": 3.739492487075087e-05,
|
|
"loss": 0.2999,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18601062893867493,
|
|
"step": 1195,
|
|
"valid_targets_mean": 4114.2,
|
|
"valid_targets_min": 305
|
|
},
|
|
{
|
|
"epoch": 1.744186046511628,
|
|
"grad_norm": 0.6130589859372811,
|
|
"learning_rate": 3.735903835313278e-05,
|
|
"loss": 0.2705,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10830438137054443,
|
|
"step": 1200,
|
|
"valid_targets_mean": 4013.6,
|
|
"valid_targets_min": 727
|
|
},
|
|
{
|
|
"epoch": 1.7514534883720931,
|
|
"grad_norm": 0.498529960515945,
|
|
"learning_rate": 3.7322923808066394e-05,
|
|
"loss": 0.3053,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1307220160961151,
|
|
"step": 1205,
|
|
"valid_targets_mean": 3688.9,
|
|
"valid_targets_min": 624
|
|
},
|
|
{
|
|
"epoch": 1.7587209302325582,
|
|
"grad_norm": 0.5482650416789371,
|
|
"learning_rate": 3.728658170995055e-05,
|
|
"loss": 0.2919,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16106528043746948,
|
|
"step": 1210,
|
|
"valid_targets_mean": 3593.9,
|
|
"valid_targets_min": 768
|
|
},
|
|
{
|
|
"epoch": 1.7659883720930232,
|
|
"grad_norm": 0.5477151270821805,
|
|
"learning_rate": 3.72500125361732e-05,
|
|
"loss": 0.3008,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13051432371139526,
|
|
"step": 1215,
|
|
"valid_targets_mean": 2720.8,
|
|
"valid_targets_min": 729
|
|
},
|
|
{
|
|
"epoch": 1.7732558139534884,
|
|
"grad_norm": 0.4407679268853417,
|
|
"learning_rate": 3.7213216767105165e-05,
|
|
"loss": 0.2845,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13464666903018951,
|
|
"step": 1220,
|
|
"valid_targets_mean": 4206.9,
|
|
"valid_targets_min": 626
|
|
},
|
|
{
|
|
"epoch": 1.7805232558139537,
|
|
"grad_norm": 0.5940188606823525,
|
|
"learning_rate": 3.71761948860938e-05,
|
|
"loss": 0.2835,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14552396535873413,
|
|
"step": 1225,
|
|
"valid_targets_mean": 2963.9,
|
|
"valid_targets_min": 440
|
|
},
|
|
{
|
|
"epoch": 1.7877906976744184,
|
|
"grad_norm": 0.5095933376877391,
|
|
"learning_rate": 3.713894737945666e-05,
|
|
"loss": 0.2722,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13193480670452118,
|
|
"step": 1230,
|
|
"valid_targets_mean": 3336.2,
|
|
"valid_targets_min": 651
|
|
},
|
|
{
|
|
"epoch": 1.7950581395348837,
|
|
"grad_norm": 0.5624492527204488,
|
|
"learning_rate": 3.71014747364751e-05,
|
|
"loss": 0.2866,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17303186655044556,
|
|
"step": 1235,
|
|
"valid_targets_mean": 3972.0,
|
|
"valid_targets_min": 497
|
|
},
|
|
{
|
|
"epoch": 1.802325581395349,
|
|
"grad_norm": 0.48051926305800385,
|
|
"learning_rate": 3.7063777449387875e-05,
|
|
"loss": 0.2745,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10240213572978973,
|
|
"step": 1240,
|
|
"valid_targets_mean": 2702.4,
|
|
"valid_targets_min": 483
|
|
},
|
|
{
|
|
"epoch": 1.809593023255814,
|
|
"grad_norm": 0.5544074964305465,
|
|
"learning_rate": 3.702585601338461e-05,
|
|
"loss": 0.278,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14542116224765778,
|
|
"step": 1245,
|
|
"valid_targets_mean": 3104.0,
|
|
"valid_targets_min": 748
|
|
},
|
|
{
|
|
"epoch": 1.816860465116279,
|
|
"grad_norm": 0.4922917541072786,
|
|
"learning_rate": 3.698771092659939e-05,
|
|
"loss": 0.2868,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14152829349040985,
|
|
"step": 1250,
|
|
"valid_targets_mean": 3484.1,
|
|
"valid_targets_min": 760
|
|
},
|
|
{
|
|
"epoch": 1.8241279069767442,
|
|
"grad_norm": 0.5277454142458948,
|
|
"learning_rate": 3.694934269010414e-05,
|
|
"loss": 0.2821,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14739757776260376,
|
|
"step": 1255,
|
|
"valid_targets_mean": 4395.9,
|
|
"valid_targets_min": 774
|
|
},
|
|
{
|
|
"epoch": 1.8313953488372094,
|
|
"grad_norm": 0.5099127031213423,
|
|
"learning_rate": 3.691075180790207e-05,
|
|
"loss": 0.2845,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12729209661483765,
|
|
"step": 1260,
|
|
"valid_targets_mean": 3339.8,
|
|
"valid_targets_min": 692
|
|
},
|
|
{
|
|
"epoch": 1.8386627906976745,
|
|
"grad_norm": 0.9200745360414155,
|
|
"learning_rate": 3.6871938786921044e-05,
|
|
"loss": 0.2958,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14698383212089539,
|
|
"step": 1265,
|
|
"valid_targets_mean": 3025.5,
|
|
"valid_targets_min": 476
|
|
},
|
|
{
|
|
"epoch": 1.8459302325581395,
|
|
"grad_norm": 0.6084589743816421,
|
|
"learning_rate": 3.683290413700695e-05,
|
|
"loss": 0.2981,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15879669785499573,
|
|
"step": 1270,
|
|
"valid_targets_mean": 2718.5,
|
|
"valid_targets_min": 627
|
|
},
|
|
{
|
|
"epoch": 1.8531976744186047,
|
|
"grad_norm": 0.4727978345525131,
|
|
"learning_rate": 3.679364837091696e-05,
|
|
"loss": 0.2781,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.180962935090065,
|
|
"step": 1275,
|
|
"valid_targets_mean": 5369.4,
|
|
"valid_targets_min": 3737
|
|
},
|
|
{
|
|
"epoch": 1.8604651162790697,
|
|
"grad_norm": 0.4700331160562772,
|
|
"learning_rate": 3.675417200431284e-05,
|
|
"loss": 0.2835,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13727298378944397,
|
|
"step": 1280,
|
|
"valid_targets_mean": 4292.6,
|
|
"valid_targets_min": 820
|
|
},
|
|
{
|
|
"epoch": 1.8677325581395348,
|
|
"grad_norm": 0.4849236576687317,
|
|
"learning_rate": 3.671447555575413e-05,
|
|
"loss": 0.2816,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.127630814909935,
|
|
"step": 1285,
|
|
"valid_targets_mean": 3766.6,
|
|
"valid_targets_min": 620
|
|
},
|
|
{
|
|
"epoch": 1.875,
|
|
"grad_norm": 0.5276934366840089,
|
|
"learning_rate": 3.667455954669138e-05,
|
|
"loss": 0.2863,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15197885036468506,
|
|
"step": 1290,
|
|
"valid_targets_mean": 3873.1,
|
|
"valid_targets_min": 803
|
|
},
|
|
{
|
|
"epoch": 1.8822674418604652,
|
|
"grad_norm": 0.7132774309429776,
|
|
"learning_rate": 3.663442450145926e-05,
|
|
"loss": 0.2895,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1851046234369278,
|
|
"step": 1295,
|
|
"valid_targets_mean": 3551.5,
|
|
"valid_targets_min": 795
|
|
},
|
|
{
|
|
"epoch": 1.8895348837209303,
|
|
"grad_norm": 0.47800429867582084,
|
|
"learning_rate": 3.6594070947269675e-05,
|
|
"loss": 0.2821,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1899186372756958,
|
|
"step": 1300,
|
|
"valid_targets_mean": 5676.8,
|
|
"valid_targets_min": 4211
|
|
},
|
|
{
|
|
"epoch": 1.8968023255813953,
|
|
"grad_norm": 0.5684669309927136,
|
|
"learning_rate": 3.65534994142049e-05,
|
|
"loss": 0.2722,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1318185180425644,
|
|
"step": 1305,
|
|
"valid_targets_mean": 2172.1,
|
|
"valid_targets_min": 543
|
|
},
|
|
{
|
|
"epoch": 1.9040697674418605,
|
|
"grad_norm": 0.6094430087247472,
|
|
"learning_rate": 3.6512710435210496e-05,
|
|
"loss": 0.2936,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12776127457618713,
|
|
"step": 1310,
|
|
"valid_targets_mean": 2547.8,
|
|
"valid_targets_min": 509
|
|
},
|
|
{
|
|
"epoch": 1.9113372093023255,
|
|
"grad_norm": 0.7826305476307706,
|
|
"learning_rate": 3.647170454608846e-05,
|
|
"loss": 0.3016,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12746961414813995,
|
|
"step": 1315,
|
|
"valid_targets_mean": 3581.9,
|
|
"valid_targets_min": 707
|
|
},
|
|
{
|
|
"epoch": 1.9186046511627906,
|
|
"grad_norm": 0.5711124612833212,
|
|
"learning_rate": 3.643048228549006e-05,
|
|
"loss": 0.2843,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16838140785694122,
|
|
"step": 1320,
|
|
"valid_targets_mean": 3616.0,
|
|
"valid_targets_min": 696
|
|
},
|
|
{
|
|
"epoch": 1.9258720930232558,
|
|
"grad_norm": 1.088493409088202,
|
|
"learning_rate": 3.638904419490882e-05,
|
|
"loss": 0.3061,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15989214181900024,
|
|
"step": 1325,
|
|
"valid_targets_mean": 4129.2,
|
|
"valid_targets_min": 681
|
|
},
|
|
{
|
|
"epoch": 1.933139534883721,
|
|
"grad_norm": 0.5637639370882057,
|
|
"learning_rate": 3.6347390818673406e-05,
|
|
"loss": 0.2964,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13954320549964905,
|
|
"step": 1330,
|
|
"valid_targets_mean": 3279.0,
|
|
"valid_targets_min": 756
|
|
},
|
|
{
|
|
"epoch": 1.940406976744186,
|
|
"grad_norm": 0.5270815044047604,
|
|
"learning_rate": 3.6305522703940446e-05,
|
|
"loss": 0.2857,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14545057713985443,
|
|
"step": 1335,
|
|
"valid_targets_mean": 4070.2,
|
|
"valid_targets_min": 652
|
|
},
|
|
{
|
|
"epoch": 1.947674418604651,
|
|
"grad_norm": 0.5231244830899889,
|
|
"learning_rate": 3.626344040068738e-05,
|
|
"loss": 0.2818,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12065362930297852,
|
|
"step": 1340,
|
|
"valid_targets_mean": 2788.0,
|
|
"valid_targets_min": 621
|
|
},
|
|
{
|
|
"epoch": 1.9549418604651163,
|
|
"grad_norm": 0.48402756241669825,
|
|
"learning_rate": 3.622114446170522e-05,
|
|
"loss": 0.2838,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11438912153244019,
|
|
"step": 1345,
|
|
"valid_targets_mean": 3629.8,
|
|
"valid_targets_min": 636
|
|
},
|
|
{
|
|
"epoch": 1.9622093023255816,
|
|
"grad_norm": 0.4797720882059406,
|
|
"learning_rate": 3.617863544259127e-05,
|
|
"loss": 0.2717,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13530614972114563,
|
|
"step": 1350,
|
|
"valid_targets_mean": 4314.6,
|
|
"valid_targets_min": 907
|
|
},
|
|
{
|
|
"epoch": 1.9694767441860463,
|
|
"grad_norm": 0.4840730467813608,
|
|
"learning_rate": 3.613591390174185e-05,
|
|
"loss": 0.2658,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13704459369182587,
|
|
"step": 1355,
|
|
"valid_targets_mean": 3770.6,
|
|
"valid_targets_min": 856
|
|
},
|
|
{
|
|
"epoch": 1.9767441860465116,
|
|
"grad_norm": 0.5333319045054723,
|
|
"learning_rate": 3.609298040034496e-05,
|
|
"loss": 0.2737,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10413102060556412,
|
|
"step": 1360,
|
|
"valid_targets_mean": 2400.1,
|
|
"valid_targets_min": 467
|
|
},
|
|
{
|
|
"epoch": 1.9840116279069768,
|
|
"grad_norm": 0.5848922636884715,
|
|
"learning_rate": 3.6049835502372894e-05,
|
|
"loss": 0.2996,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1518581211566925,
|
|
"step": 1365,
|
|
"valid_targets_mean": 3005.8,
|
|
"valid_targets_min": 129
|
|
},
|
|
{
|
|
"epoch": 1.9912790697674418,
|
|
"grad_norm": 0.47721552430914416,
|
|
"learning_rate": 3.6006479774574846e-05,
|
|
"loss": 0.2752,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13737758994102478,
|
|
"step": 1370,
|
|
"valid_targets_mean": 4180.2,
|
|
"valid_targets_min": 994
|
|
},
|
|
{
|
|
"epoch": 1.9985465116279069,
|
|
"grad_norm": 0.5364106208178079,
|
|
"learning_rate": 3.596291378646947e-05,
|
|
"loss": 0.276,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09656524658203125,
|
|
"step": 1375,
|
|
"valid_targets_mean": 1684.8,
|
|
"valid_targets_min": 516
|
|
},
|
|
{
|
|
"epoch": 2.005813953488372,
|
|
"grad_norm": 0.5376377641998679,
|
|
"learning_rate": 3.591913811033736e-05,
|
|
"loss": 0.2784,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08827735483646393,
|
|
"step": 1380,
|
|
"valid_targets_mean": 2703.1,
|
|
"valid_targets_min": 374
|
|
},
|
|
{
|
|
"epoch": 2.0130813953488373,
|
|
"grad_norm": 0.5848775272946124,
|
|
"learning_rate": 3.58751533212136e-05,
|
|
"loss": 0.2654,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18071289360523224,
|
|
"step": 1385,
|
|
"valid_targets_mean": 3698.2,
|
|
"valid_targets_min": 646
|
|
},
|
|
{
|
|
"epoch": 2.020348837209302,
|
|
"grad_norm": 0.5127749221390476,
|
|
"learning_rate": 3.5830959996880134e-05,
|
|
"loss": 0.263,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15570735931396484,
|
|
"step": 1390,
|
|
"valid_targets_mean": 4655.9,
|
|
"valid_targets_min": 948
|
|
},
|
|
{
|
|
"epoch": 2.0276162790697674,
|
|
"grad_norm": 0.4743043393339027,
|
|
"learning_rate": 3.578655871785824e-05,
|
|
"loss": 0.2709,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1249096691608429,
|
|
"step": 1395,
|
|
"valid_targets_mean": 4346.9,
|
|
"valid_targets_min": 765
|
|
},
|
|
{
|
|
"epoch": 2.0348837209302326,
|
|
"grad_norm": 0.49366831615834167,
|
|
"learning_rate": 3.574195006740087e-05,
|
|
"loss": 0.2538,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12072114646434784,
|
|
"step": 1400,
|
|
"valid_targets_mean": 4137.4,
|
|
"valid_targets_min": 719
|
|
},
|
|
{
|
|
"epoch": 2.042151162790698,
|
|
"grad_norm": 0.49849763580575895,
|
|
"learning_rate": 3.5697134631485e-05,
|
|
"loss": 0.2547,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11655795574188232,
|
|
"step": 1405,
|
|
"valid_targets_mean": 4410.6,
|
|
"valid_targets_min": 1031
|
|
},
|
|
{
|
|
"epoch": 2.0494186046511627,
|
|
"grad_norm": 0.5234158764293848,
|
|
"learning_rate": 3.5652112998803914e-05,
|
|
"loss": 0.2763,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12006824463605881,
|
|
"step": 1410,
|
|
"valid_targets_mean": 3905.4,
|
|
"valid_targets_min": 855
|
|
},
|
|
{
|
|
"epoch": 2.056686046511628,
|
|
"grad_norm": 0.4846891544610793,
|
|
"learning_rate": 3.560688576075951e-05,
|
|
"loss": 0.2538,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14693428575992584,
|
|
"step": 1415,
|
|
"valid_targets_mean": 4482.4,
|
|
"valid_targets_min": 448
|
|
},
|
|
{
|
|
"epoch": 2.063953488372093,
|
|
"grad_norm": 0.47199386841521335,
|
|
"learning_rate": 3.5561453511454485e-05,
|
|
"loss": 0.278,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11529761552810669,
|
|
"step": 1420,
|
|
"valid_targets_mean": 4109.1,
|
|
"valid_targets_min": 1126
|
|
},
|
|
{
|
|
"epoch": 2.071220930232558,
|
|
"grad_norm": 0.48678567559248875,
|
|
"learning_rate": 3.551581684768457e-05,
|
|
"loss": 0.2647,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1414426863193512,
|
|
"step": 1425,
|
|
"valid_targets_mean": 4217.1,
|
|
"valid_targets_min": 634
|
|
},
|
|
{
|
|
"epoch": 2.078488372093023,
|
|
"grad_norm": 0.6118910096762987,
|
|
"learning_rate": 3.546997636893067e-05,
|
|
"loss": 0.2699,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10148027539253235,
|
|
"step": 1430,
|
|
"valid_targets_mean": 2007.8,
|
|
"valid_targets_min": 487
|
|
},
|
|
{
|
|
"epoch": 2.0857558139534884,
|
|
"grad_norm": 0.5224485792193987,
|
|
"learning_rate": 3.542393267735098e-05,
|
|
"loss": 0.2725,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1559983342885971,
|
|
"step": 1435,
|
|
"valid_targets_mean": 4773.1,
|
|
"valid_targets_min": 908
|
|
},
|
|
{
|
|
"epoch": 2.0930232558139537,
|
|
"grad_norm": 0.554028772115384,
|
|
"learning_rate": 3.537768637777312e-05,
|
|
"loss": 0.2795,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19308879971504211,
|
|
"step": 1440,
|
|
"valid_targets_mean": 4352.8,
|
|
"valid_targets_min": 741
|
|
},
|
|
{
|
|
"epoch": 2.1002906976744184,
|
|
"grad_norm": 0.4621989703112275,
|
|
"learning_rate": 3.533123807768612e-05,
|
|
"loss": 0.2609,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1113363653421402,
|
|
"step": 1445,
|
|
"valid_targets_mean": 3969.4,
|
|
"valid_targets_min": 773
|
|
},
|
|
{
|
|
"epoch": 2.1075581395348837,
|
|
"grad_norm": 0.49525226186923427,
|
|
"learning_rate": 3.52845883872325e-05,
|
|
"loss": 0.2708,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.135954812169075,
|
|
"step": 1450,
|
|
"valid_targets_mean": 4239.1,
|
|
"valid_targets_min": 890
|
|
},
|
|
{
|
|
"epoch": 2.114825581395349,
|
|
"grad_norm": 0.5536797366019663,
|
|
"learning_rate": 3.523773791920023e-05,
|
|
"loss": 0.2636,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1700039952993393,
|
|
"step": 1455,
|
|
"valid_targets_mean": 3623.2,
|
|
"valid_targets_min": 670
|
|
},
|
|
{
|
|
"epoch": 2.1220930232558137,
|
|
"grad_norm": 0.5583987169370682,
|
|
"learning_rate": 3.51906872890147e-05,
|
|
"loss": 0.267,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11081169545650482,
|
|
"step": 1460,
|
|
"valid_targets_mean": 3194.4,
|
|
"valid_targets_min": 766
|
|
},
|
|
{
|
|
"epoch": 2.129360465116279,
|
|
"grad_norm": 0.675993039275515,
|
|
"learning_rate": 3.514343711473058e-05,
|
|
"loss": 0.2655,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12630599737167358,
|
|
"step": 1465,
|
|
"valid_targets_mean": 2452.6,
|
|
"valid_targets_min": 614
|
|
},
|
|
{
|
|
"epoch": 2.136627906976744,
|
|
"grad_norm": 0.5146630082127743,
|
|
"learning_rate": 3.509598801702378e-05,
|
|
"loss": 0.2563,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1256990283727646,
|
|
"step": 1470,
|
|
"valid_targets_mean": 3438.5,
|
|
"valid_targets_min": 595
|
|
},
|
|
{
|
|
"epoch": 2.1438953488372094,
|
|
"grad_norm": 0.4820414562746019,
|
|
"learning_rate": 3.504834061918324e-05,
|
|
"loss": 0.2591,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13081446290016174,
|
|
"step": 1475,
|
|
"valid_targets_mean": 3915.8,
|
|
"valid_targets_min": 814
|
|
},
|
|
{
|
|
"epoch": 2.1511627906976742,
|
|
"grad_norm": 0.5260061998630678,
|
|
"learning_rate": 3.5000495547102766e-05,
|
|
"loss": 0.2664,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13811007142066956,
|
|
"step": 1480,
|
|
"valid_targets_mean": 4041.0,
|
|
"valid_targets_min": 788
|
|
},
|
|
{
|
|
"epoch": 2.1584302325581395,
|
|
"grad_norm": 0.5293063498281043,
|
|
"learning_rate": 3.49524534292728e-05,
|
|
"loss": 0.2625,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1273302435874939,
|
|
"step": 1485,
|
|
"valid_targets_mean": 3316.5,
|
|
"valid_targets_min": 459
|
|
},
|
|
{
|
|
"epoch": 2.1656976744186047,
|
|
"grad_norm": 0.5661275028710806,
|
|
"learning_rate": 3.490421489677217e-05,
|
|
"loss": 0.2644,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11345352232456207,
|
|
"step": 1490,
|
|
"valid_targets_mean": 2989.9,
|
|
"valid_targets_min": 534
|
|
},
|
|
{
|
|
"epoch": 2.17296511627907,
|
|
"grad_norm": 0.5426548944493367,
|
|
"learning_rate": 3.485578058325979e-05,
|
|
"loss": 0.2737,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10773831605911255,
|
|
"step": 1495,
|
|
"valid_targets_mean": 2618.4,
|
|
"valid_targets_min": 796
|
|
},
|
|
{
|
|
"epoch": 2.1802325581395348,
|
|
"grad_norm": 0.5358415375531889,
|
|
"learning_rate": 3.480715112496634e-05,
|
|
"loss": 0.2628,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12474462389945984,
|
|
"step": 1500,
|
|
"valid_targets_mean": 3247.8,
|
|
"valid_targets_min": 556
|
|
},
|
|
{
|
|
"epoch": 2.1875,
|
|
"grad_norm": 0.5091256086283701,
|
|
"learning_rate": 3.475832716068595e-05,
|
|
"loss": 0.2624,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1339842975139618,
|
|
"step": 1505,
|
|
"valid_targets_mean": 3784.9,
|
|
"valid_targets_min": 612
|
|
},
|
|
{
|
|
"epoch": 2.1947674418604652,
|
|
"grad_norm": 0.4526849642798776,
|
|
"learning_rate": 3.47093093317677e-05,
|
|
"loss": 0.2595,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12192752957344055,
|
|
"step": 1510,
|
|
"valid_targets_mean": 4210.1,
|
|
"valid_targets_min": 763
|
|
},
|
|
{
|
|
"epoch": 2.20203488372093,
|
|
"grad_norm": 0.6418251014891065,
|
|
"learning_rate": 3.4660098282107344e-05,
|
|
"loss": 0.2653,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17555320262908936,
|
|
"step": 1515,
|
|
"valid_targets_mean": 3093.1,
|
|
"valid_targets_min": 571
|
|
},
|
|
{
|
|
"epoch": 2.2093023255813953,
|
|
"grad_norm": 0.4978248898803813,
|
|
"learning_rate": 3.461069465813871e-05,
|
|
"loss": 0.2725,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14208854734897614,
|
|
"step": 1520,
|
|
"valid_targets_mean": 3839.2,
|
|
"valid_targets_min": 804
|
|
},
|
|
{
|
|
"epoch": 2.2165697674418605,
|
|
"grad_norm": 0.48938820010360695,
|
|
"learning_rate": 3.4561099108825323e-05,
|
|
"loss": 0.2703,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09456305205821991,
|
|
"step": 1525,
|
|
"valid_targets_mean": 3440.4,
|
|
"valid_targets_min": 665
|
|
},
|
|
{
|
|
"epoch": 2.2238372093023258,
|
|
"grad_norm": 0.5494920221285224,
|
|
"learning_rate": 3.451131228565179e-05,
|
|
"loss": 0.2625,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09877356886863708,
|
|
"step": 1530,
|
|
"valid_targets_mean": 2651.8,
|
|
"valid_targets_min": 658
|
|
},
|
|
{
|
|
"epoch": 2.2311046511627906,
|
|
"grad_norm": 0.49439302152720127,
|
|
"learning_rate": 3.446133484261529e-05,
|
|
"loss": 0.276,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17575523257255554,
|
|
"step": 1535,
|
|
"valid_targets_mean": 4729.0,
|
|
"valid_targets_min": 3501
|
|
},
|
|
{
|
|
"epoch": 2.238372093023256,
|
|
"grad_norm": 0.5307421275306936,
|
|
"learning_rate": 3.4411167436217004e-05,
|
|
"loss": 0.2742,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16329185664653778,
|
|
"step": 1540,
|
|
"valid_targets_mean": 4051.8,
|
|
"valid_targets_min": 693
|
|
},
|
|
{
|
|
"epoch": 2.245639534883721,
|
|
"grad_norm": 0.5270385519838316,
|
|
"learning_rate": 3.436081072545343e-05,
|
|
"loss": 0.2636,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14654135704040527,
|
|
"step": 1545,
|
|
"valid_targets_mean": 3702.0,
|
|
"valid_targets_min": 546
|
|
},
|
|
{
|
|
"epoch": 2.2529069767441863,
|
|
"grad_norm": 0.5552539214544302,
|
|
"learning_rate": 3.4310265371807775e-05,
|
|
"loss": 0.276,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10971195250749588,
|
|
"step": 1550,
|
|
"valid_targets_mean": 2676.8,
|
|
"valid_targets_min": 562
|
|
},
|
|
{
|
|
"epoch": 2.260174418604651,
|
|
"grad_norm": 0.5352876944143984,
|
|
"learning_rate": 3.4259532039241234e-05,
|
|
"loss": 0.2708,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13568298518657684,
|
|
"step": 1555,
|
|
"valid_targets_mean": 3398.1,
|
|
"valid_targets_min": 767
|
|
},
|
|
{
|
|
"epoch": 2.2674418604651163,
|
|
"grad_norm": 0.4369482033410833,
|
|
"learning_rate": 3.420861139418429e-05,
|
|
"loss": 0.2662,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1382427215576172,
|
|
"step": 1560,
|
|
"valid_targets_mean": 5266.9,
|
|
"valid_targets_min": 809
|
|
},
|
|
{
|
|
"epoch": 2.2747093023255816,
|
|
"grad_norm": 0.515678213997273,
|
|
"learning_rate": 3.4157504105527976e-05,
|
|
"loss": 0.2667,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16098284721374512,
|
|
"step": 1565,
|
|
"valid_targets_mean": 4429.6,
|
|
"valid_targets_min": 758
|
|
},
|
|
{
|
|
"epoch": 2.2819767441860463,
|
|
"grad_norm": 0.5097940592273604,
|
|
"learning_rate": 3.410621084461503e-05,
|
|
"loss": 0.2877,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14763861894607544,
|
|
"step": 1570,
|
|
"valid_targets_mean": 3918.2,
|
|
"valid_targets_min": 759
|
|
},
|
|
{
|
|
"epoch": 2.2892441860465116,
|
|
"grad_norm": 0.534212765089729,
|
|
"learning_rate": 3.405473228523114e-05,
|
|
"loss": 0.2639,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12504583597183228,
|
|
"step": 1575,
|
|
"valid_targets_mean": 3447.0,
|
|
"valid_targets_min": 711
|
|
},
|
|
{
|
|
"epoch": 2.296511627906977,
|
|
"grad_norm": 0.45809911560904876,
|
|
"learning_rate": 3.4003069103596034e-05,
|
|
"loss": 0.2711,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12107375264167786,
|
|
"step": 1580,
|
|
"valid_targets_mean": 4068.2,
|
|
"valid_targets_min": 513
|
|
},
|
|
{
|
|
"epoch": 2.303779069767442,
|
|
"grad_norm": 0.5058709902336606,
|
|
"learning_rate": 3.395122197835467e-05,
|
|
"loss": 0.2722,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09252685308456421,
|
|
"step": 1585,
|
|
"valid_targets_mean": 2139.4,
|
|
"valid_targets_min": 524
|
|
},
|
|
{
|
|
"epoch": 2.311046511627907,
|
|
"grad_norm": 0.4841137765066096,
|
|
"learning_rate": 3.389919159056825e-05,
|
|
"loss": 0.2656,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13058248162269592,
|
|
"step": 1590,
|
|
"valid_targets_mean": 3712.4,
|
|
"valid_targets_min": 587
|
|
},
|
|
{
|
|
"epoch": 2.318313953488372,
|
|
"grad_norm": 0.6314252709339271,
|
|
"learning_rate": 3.384697862370531e-05,
|
|
"loss": 0.2731,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12193869054317474,
|
|
"step": 1595,
|
|
"valid_targets_mean": 4012.1,
|
|
"valid_targets_min": 689
|
|
},
|
|
{
|
|
"epoch": 2.3255813953488373,
|
|
"grad_norm": 0.4791491037613609,
|
|
"learning_rate": 3.379458376363274e-05,
|
|
"loss": 0.2588,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11508563160896301,
|
|
"step": 1600,
|
|
"valid_targets_mean": 3614.6,
|
|
"valid_targets_min": 876
|
|
},
|
|
{
|
|
"epoch": 2.332848837209302,
|
|
"grad_norm": 0.4932888283945881,
|
|
"learning_rate": 3.374200769860676e-05,
|
|
"loss": 0.2614,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1386955976486206,
|
|
"step": 1605,
|
|
"valid_targets_mean": 4039.6,
|
|
"valid_targets_min": 301
|
|
},
|
|
{
|
|
"epoch": 2.3401162790697674,
|
|
"grad_norm": 0.549901709584174,
|
|
"learning_rate": 3.368925111926391e-05,
|
|
"loss": 0.2749,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1280840039253235,
|
|
"step": 1610,
|
|
"valid_targets_mean": 3070.8,
|
|
"valid_targets_min": 652
|
|
},
|
|
{
|
|
"epoch": 2.3473837209302326,
|
|
"grad_norm": 0.5945830691027769,
|
|
"learning_rate": 3.363631471861194e-05,
|
|
"loss": 0.2697,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09050530195236206,
|
|
"step": 1615,
|
|
"valid_targets_mean": 1939.2,
|
|
"valid_targets_min": 508
|
|
},
|
|
{
|
|
"epoch": 2.354651162790698,
|
|
"grad_norm": 0.4744283976817756,
|
|
"learning_rate": 3.358319919202071e-05,
|
|
"loss": 0.2671,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11523960530757904,
|
|
"step": 1620,
|
|
"valid_targets_mean": 4096.6,
|
|
"valid_targets_min": 645
|
|
},
|
|
{
|
|
"epoch": 2.3619186046511627,
|
|
"grad_norm": 0.4847224210381442,
|
|
"learning_rate": 3.35299052372131e-05,
|
|
"loss": 0.2756,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13617539405822754,
|
|
"step": 1625,
|
|
"valid_targets_mean": 3855.5,
|
|
"valid_targets_min": 1132
|
|
},
|
|
{
|
|
"epoch": 2.369186046511628,
|
|
"grad_norm": 0.49840708948568,
|
|
"learning_rate": 3.3476433554255806e-05,
|
|
"loss": 0.2824,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1390097290277481,
|
|
"step": 1630,
|
|
"valid_targets_mean": 3952.4,
|
|
"valid_targets_min": 748
|
|
},
|
|
{
|
|
"epoch": 2.376453488372093,
|
|
"grad_norm": 0.5001556376410387,
|
|
"learning_rate": 3.342278484555014e-05,
|
|
"loss": 0.2686,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13502594828605652,
|
|
"step": 1635,
|
|
"valid_targets_mean": 3625.5,
|
|
"valid_targets_min": 597
|
|
},
|
|
{
|
|
"epoch": 2.383720930232558,
|
|
"grad_norm": 0.635635101849715,
|
|
"learning_rate": 3.336895981582282e-05,
|
|
"loss": 0.2863,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13348835706710815,
|
|
"step": 1640,
|
|
"valid_targets_mean": 2283.8,
|
|
"valid_targets_min": 760
|
|
},
|
|
{
|
|
"epoch": 2.390988372093023,
|
|
"grad_norm": 0.5264719953651338,
|
|
"learning_rate": 3.3314959172116705e-05,
|
|
"loss": 0.2655,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09972628951072693,
|
|
"step": 1645,
|
|
"valid_targets_mean": 2570.2,
|
|
"valid_targets_min": 592
|
|
},
|
|
{
|
|
"epoch": 2.3982558139534884,
|
|
"grad_norm": 0.832672751160306,
|
|
"learning_rate": 3.326078362378152e-05,
|
|
"loss": 0.2635,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14847052097320557,
|
|
"step": 1650,
|
|
"valid_targets_mean": 3953.1,
|
|
"valid_targets_min": 720
|
|
},
|
|
{
|
|
"epoch": 2.4055232558139537,
|
|
"grad_norm": 0.5583772379822669,
|
|
"learning_rate": 3.320643388246452e-05,
|
|
"loss": 0.255,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1574249118566513,
|
|
"step": 1655,
|
|
"valid_targets_mean": 3535.5,
|
|
"valid_targets_min": 799
|
|
},
|
|
{
|
|
"epoch": 2.4127906976744184,
|
|
"grad_norm": 0.5046469808226955,
|
|
"learning_rate": 3.315191066210117e-05,
|
|
"loss": 0.2727,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16248942911624908,
|
|
"step": 1660,
|
|
"valid_targets_mean": 4482.1,
|
|
"valid_targets_min": 614
|
|
},
|
|
{
|
|
"epoch": 2.4200581395348837,
|
|
"grad_norm": 0.5294602291358438,
|
|
"learning_rate": 3.309721467890571e-05,
|
|
"loss": 0.2738,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1385262906551361,
|
|
"step": 1665,
|
|
"valid_targets_mean": 3637.4,
|
|
"valid_targets_min": 536
|
|
},
|
|
{
|
|
"epoch": 2.427325581395349,
|
|
"grad_norm": 0.4704899630611958,
|
|
"learning_rate": 3.3042346651361804e-05,
|
|
"loss": 0.264,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11646417528390884,
|
|
"step": 1670,
|
|
"valid_targets_mean": 3672.1,
|
|
"valid_targets_min": 692
|
|
},
|
|
{
|
|
"epoch": 2.4345930232558137,
|
|
"grad_norm": 0.5379513628865499,
|
|
"learning_rate": 3.298730730021309e-05,
|
|
"loss": 0.2645,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1307636946439743,
|
|
"step": 1675,
|
|
"valid_targets_mean": 3688.2,
|
|
"valid_targets_min": 510
|
|
},
|
|
{
|
|
"epoch": 2.441860465116279,
|
|
"grad_norm": 0.5717757647803172,
|
|
"learning_rate": 3.2932097348453696e-05,
|
|
"loss": 0.2736,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13288994133472443,
|
|
"step": 1680,
|
|
"valid_targets_mean": 2601.6,
|
|
"valid_targets_min": 551
|
|
},
|
|
{
|
|
"epoch": 2.449127906976744,
|
|
"grad_norm": 0.5799851581117721,
|
|
"learning_rate": 3.287671752131875e-05,
|
|
"loss": 0.264,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12425574660301208,
|
|
"step": 1685,
|
|
"valid_targets_mean": 2572.4,
|
|
"valid_targets_min": 509
|
|
},
|
|
{
|
|
"epoch": 2.4563953488372094,
|
|
"grad_norm": 0.5051100514029051,
|
|
"learning_rate": 3.282116854627485e-05,
|
|
"loss": 0.2756,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12104862928390503,
|
|
"step": 1690,
|
|
"valid_targets_mean": 3290.8,
|
|
"valid_targets_min": 556
|
|
},
|
|
{
|
|
"epoch": 2.4636627906976742,
|
|
"grad_norm": 0.4884476414997209,
|
|
"learning_rate": 3.276545115301053e-05,
|
|
"loss": 0.2739,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14237235486507416,
|
|
"step": 1695,
|
|
"valid_targets_mean": 4186.4,
|
|
"valid_targets_min": 861
|
|
},
|
|
{
|
|
"epoch": 2.4709302325581395,
|
|
"grad_norm": 0.453706781086496,
|
|
"learning_rate": 3.270956607342663e-05,
|
|
"loss": 0.2682,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1469501554965973,
|
|
"step": 1700,
|
|
"valid_targets_mean": 4740.9,
|
|
"valid_targets_min": 546
|
|
},
|
|
{
|
|
"epoch": 2.4781976744186047,
|
|
"grad_norm": 0.588829728213914,
|
|
"learning_rate": 3.265351404162673e-05,
|
|
"loss": 0.2761,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09756440669298172,
|
|
"step": 1705,
|
|
"valid_targets_mean": 2120.9,
|
|
"valid_targets_min": 600
|
|
},
|
|
{
|
|
"epoch": 2.4854651162790695,
|
|
"grad_norm": 0.4613022019381626,
|
|
"learning_rate": 3.259729579390749e-05,
|
|
"loss": 0.2635,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11998298764228821,
|
|
"step": 1710,
|
|
"valid_targets_mean": 4440.6,
|
|
"valid_targets_min": 685
|
|
},
|
|
{
|
|
"epoch": 2.4927325581395348,
|
|
"grad_norm": 0.5431743435441446,
|
|
"learning_rate": 3.254091206874895e-05,
|
|
"loss": 0.276,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1468546837568283,
|
|
"step": 1715,
|
|
"valid_targets_mean": 3191.4,
|
|
"valid_targets_min": 819
|
|
},
|
|
{
|
|
"epoch": 2.5,
|
|
"grad_norm": 0.45513843549770333,
|
|
"learning_rate": 3.248436360680487e-05,
|
|
"loss": 0.2559,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14219807088375092,
|
|
"step": 1720,
|
|
"valid_targets_mean": 4397.4,
|
|
"valid_targets_min": 1024
|
|
},
|
|
{
|
|
"epoch": 2.5072674418604652,
|
|
"grad_norm": 0.5024140936757149,
|
|
"learning_rate": 3.2427651150892984e-05,
|
|
"loss": 0.2675,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15499092638492584,
|
|
"step": 1725,
|
|
"valid_targets_mean": 4194.4,
|
|
"valid_targets_min": 615
|
|
},
|
|
{
|
|
"epoch": 2.5145348837209305,
|
|
"grad_norm": 0.4698206860809935,
|
|
"learning_rate": 3.237077544598524e-05,
|
|
"loss": 0.2744,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12705135345458984,
|
|
"step": 1730,
|
|
"valid_targets_mean": 3559.4,
|
|
"valid_targets_min": 559
|
|
},
|
|
{
|
|
"epoch": 2.5218023255813953,
|
|
"grad_norm": 0.46964481606078307,
|
|
"learning_rate": 3.2313737239198015e-05,
|
|
"loss": 0.2737,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14902839064598083,
|
|
"step": 1735,
|
|
"valid_targets_mean": 4454.0,
|
|
"valid_targets_min": 575
|
|
},
|
|
{
|
|
"epoch": 2.5290697674418605,
|
|
"grad_norm": 0.5092078095756714,
|
|
"learning_rate": 3.22565372797823e-05,
|
|
"loss": 0.2661,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13162916898727417,
|
|
"step": 1740,
|
|
"valid_targets_mean": 4042.2,
|
|
"valid_targets_min": 796
|
|
},
|
|
{
|
|
"epoch": 2.5363372093023253,
|
|
"grad_norm": 0.4532399507806315,
|
|
"learning_rate": 3.219917631911387e-05,
|
|
"loss": 0.2655,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12575411796569824,
|
|
"step": 1745,
|
|
"valid_targets_mean": 4582.4,
|
|
"valid_targets_min": 765
|
|
},
|
|
{
|
|
"epoch": 2.5436046511627906,
|
|
"grad_norm": 0.4970025077230629,
|
|
"learning_rate": 3.2141655110683396e-05,
|
|
"loss": 0.2567,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1303708553314209,
|
|
"step": 1750,
|
|
"valid_targets_mean": 3502.8,
|
|
"valid_targets_min": 596
|
|
},
|
|
{
|
|
"epoch": 2.550872093023256,
|
|
"grad_norm": 0.46718017929321,
|
|
"learning_rate": 3.208397441008655e-05,
|
|
"loss": 0.2611,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11836321651935577,
|
|
"step": 1755,
|
|
"valid_targets_mean": 4335.2,
|
|
"valid_targets_min": 884
|
|
},
|
|
{
|
|
"epoch": 2.558139534883721,
|
|
"grad_norm": 0.4799250453339413,
|
|
"learning_rate": 3.20261349750141e-05,
|
|
"loss": 0.2708,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1215079128742218,
|
|
"step": 1760,
|
|
"valid_targets_mean": 3528.9,
|
|
"valid_targets_min": 678
|
|
},
|
|
{
|
|
"epoch": 2.5654069767441863,
|
|
"grad_norm": 0.45115735719212735,
|
|
"learning_rate": 3.1968137565241936e-05,
|
|
"loss": 0.2718,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1389511227607727,
|
|
"step": 1765,
|
|
"valid_targets_mean": 4299.8,
|
|
"valid_targets_min": 547
|
|
},
|
|
{
|
|
"epoch": 2.572674418604651,
|
|
"grad_norm": 0.46289799998348813,
|
|
"learning_rate": 3.1909982942621085e-05,
|
|
"loss": 0.2613,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12753698229789734,
|
|
"step": 1770,
|
|
"valid_targets_mean": 4688.4,
|
|
"valid_targets_min": 4064
|
|
},
|
|
{
|
|
"epoch": 2.5799418604651163,
|
|
"grad_norm": 0.5129108516304612,
|
|
"learning_rate": 3.185167187106774e-05,
|
|
"loss": 0.2698,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19303864240646362,
|
|
"step": 1775,
|
|
"valid_targets_mean": 4826.6,
|
|
"valid_targets_min": 580
|
|
},
|
|
{
|
|
"epoch": 2.5872093023255816,
|
|
"grad_norm": 0.468090560312537,
|
|
"learning_rate": 3.179320511655317e-05,
|
|
"loss": 0.2575,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11583010852336884,
|
|
"step": 1780,
|
|
"valid_targets_mean": 3707.1,
|
|
"valid_targets_min": 666
|
|
},
|
|
{
|
|
"epoch": 2.5944767441860463,
|
|
"grad_norm": 0.4703450689865459,
|
|
"learning_rate": 3.1734583447093696e-05,
|
|
"loss": 0.2739,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12104140222072601,
|
|
"step": 1785,
|
|
"valid_targets_mean": 4700.1,
|
|
"valid_targets_min": 4102
|
|
},
|
|
{
|
|
"epoch": 2.6017441860465116,
|
|
"grad_norm": 0.4869676856169924,
|
|
"learning_rate": 3.167580763274061e-05,
|
|
"loss": 0.2731,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16636613011360168,
|
|
"step": 1790,
|
|
"valid_targets_mean": 4863.0,
|
|
"valid_targets_min": 1046
|
|
},
|
|
{
|
|
"epoch": 2.609011627906977,
|
|
"grad_norm": 0.4709917726328331,
|
|
"learning_rate": 3.161687844557002e-05,
|
|
"loss": 0.2573,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1224159300327301,
|
|
"step": 1795,
|
|
"valid_targets_mean": 3573.0,
|
|
"valid_targets_min": 581
|
|
},
|
|
{
|
|
"epoch": 2.616279069767442,
|
|
"grad_norm": 0.5171426552209677,
|
|
"learning_rate": 3.155779665967275e-05,
|
|
"loss": 0.2628,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11179779469966888,
|
|
"step": 1800,
|
|
"valid_targets_mean": 2782.5,
|
|
"valid_targets_min": 743
|
|
},
|
|
{
|
|
"epoch": 2.623546511627907,
|
|
"grad_norm": 0.6081646224080811,
|
|
"learning_rate": 3.149856305114416e-05,
|
|
"loss": 0.2543,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10924814641475677,
|
|
"step": 1805,
|
|
"valid_targets_mean": 2735.4,
|
|
"valid_targets_min": 477
|
|
},
|
|
{
|
|
"epoch": 2.630813953488372,
|
|
"grad_norm": 0.4581547282472409,
|
|
"learning_rate": 3.1439178398073896e-05,
|
|
"loss": 0.2561,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10915856063365936,
|
|
"step": 1810,
|
|
"valid_targets_mean": 3889.6,
|
|
"valid_targets_min": 545
|
|
},
|
|
{
|
|
"epoch": 2.6380813953488373,
|
|
"grad_norm": 0.49063719223863217,
|
|
"learning_rate": 3.137964348053578e-05,
|
|
"loss": 0.2704,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11040124297142029,
|
|
"step": 1815,
|
|
"valid_targets_mean": 3438.1,
|
|
"valid_targets_min": 642
|
|
},
|
|
{
|
|
"epoch": 2.645348837209302,
|
|
"grad_norm": 0.5163640076530557,
|
|
"learning_rate": 3.1319959080577464e-05,
|
|
"loss": 0.2818,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12543052434921265,
|
|
"step": 1820,
|
|
"valid_targets_mean": 3359.4,
|
|
"valid_targets_min": 905
|
|
},
|
|
{
|
|
"epoch": 2.6526162790697674,
|
|
"grad_norm": 0.5524842388527516,
|
|
"learning_rate": 3.12601259822102e-05,
|
|
"loss": 0.2582,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1084834486246109,
|
|
"step": 1825,
|
|
"valid_targets_mean": 2511.4,
|
|
"valid_targets_min": 571
|
|
},
|
|
{
|
|
"epoch": 2.6598837209302326,
|
|
"grad_norm": 0.4564108099525801,
|
|
"learning_rate": 3.120014497139853e-05,
|
|
"loss": 0.2663,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13041335344314575,
|
|
"step": 1830,
|
|
"valid_targets_mean": 4113.4,
|
|
"valid_targets_min": 751
|
|
},
|
|
{
|
|
"epoch": 2.667151162790698,
|
|
"grad_norm": 0.5154330112071223,
|
|
"learning_rate": 3.114001683604999e-05,
|
|
"loss": 0.2655,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13782872259616852,
|
|
"step": 1835,
|
|
"valid_targets_mean": 3823.5,
|
|
"valid_targets_min": 579
|
|
},
|
|
{
|
|
"epoch": 2.6744186046511627,
|
|
"grad_norm": 0.463060723588905,
|
|
"learning_rate": 3.1079742366004713e-05,
|
|
"loss": 0.252,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1174917072057724,
|
|
"step": 1840,
|
|
"valid_targets_mean": 3915.1,
|
|
"valid_targets_min": 576
|
|
},
|
|
{
|
|
"epoch": 2.681686046511628,
|
|
"grad_norm": 0.5961585496445909,
|
|
"learning_rate": 3.101932235302508e-05,
|
|
"loss": 0.2685,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10630868375301361,
|
|
"step": 1845,
|
|
"valid_targets_mean": 2058.0,
|
|
"valid_targets_min": 586
|
|
},
|
|
{
|
|
"epoch": 2.688953488372093,
|
|
"grad_norm": 0.5109244436734283,
|
|
"learning_rate": 3.095875759078532e-05,
|
|
"loss": 0.2567,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13750335574150085,
|
|
"step": 1850,
|
|
"valid_targets_mean": 4089.5,
|
|
"valid_targets_min": 605
|
|
},
|
|
{
|
|
"epoch": 2.696220930232558,
|
|
"grad_norm": 0.5571546603571644,
|
|
"learning_rate": 3.089804887486109e-05,
|
|
"loss": 0.2695,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1483413279056549,
|
|
"step": 1855,
|
|
"valid_targets_mean": 3544.2,
|
|
"valid_targets_min": 506
|
|
},
|
|
{
|
|
"epoch": 2.703488372093023,
|
|
"grad_norm": 0.45865410869498385,
|
|
"learning_rate": 3.083719700271899e-05,
|
|
"loss": 0.2699,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13529357314109802,
|
|
"step": 1860,
|
|
"valid_targets_mean": 4811.1,
|
|
"valid_targets_min": 3742
|
|
},
|
|
{
|
|
"epoch": 2.7107558139534884,
|
|
"grad_norm": 0.48848398241959,
|
|
"learning_rate": 3.0776202773706136e-05,
|
|
"loss": 0.2613,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1369183510541916,
|
|
"step": 1865,
|
|
"valid_targets_mean": 4284.4,
|
|
"valid_targets_min": 773
|
|
},
|
|
{
|
|
"epoch": 2.7180232558139537,
|
|
"grad_norm": 0.4383701642333588,
|
|
"learning_rate": 3.0715066989039634e-05,
|
|
"loss": 0.2583,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12336073815822601,
|
|
"step": 1870,
|
|
"valid_targets_mean": 4134.5,
|
|
"valid_targets_min": 776
|
|
},
|
|
{
|
|
"epoch": 2.7252906976744184,
|
|
"grad_norm": 0.5109306368537913,
|
|
"learning_rate": 3.0653790451796065e-05,
|
|
"loss": 0.2681,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12276113033294678,
|
|
"step": 1875,
|
|
"valid_targets_mean": 3308.4,
|
|
"valid_targets_min": 729
|
|
},
|
|
{
|
|
"epoch": 2.7325581395348837,
|
|
"grad_norm": 0.48931231779838447,
|
|
"learning_rate": 3.05923739669009e-05,
|
|
"loss": 0.2623,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1452603042125702,
|
|
"step": 1880,
|
|
"valid_targets_mean": 4120.5,
|
|
"valid_targets_min": 509
|
|
},
|
|
{
|
|
"epoch": 2.739825581395349,
|
|
"grad_norm": 0.4782124055851078,
|
|
"learning_rate": 3.0530818341117974e-05,
|
|
"loss": 0.2822,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.19867317378520966,
|
|
"step": 1885,
|
|
"valid_targets_mean": 5492.8,
|
|
"valid_targets_min": 3347
|
|
},
|
|
{
|
|
"epoch": 2.7470930232558137,
|
|
"grad_norm": 0.5970060105644365,
|
|
"learning_rate": 3.046912438303887e-05,
|
|
"loss": 0.2689,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.111583411693573,
|
|
"step": 1890,
|
|
"valid_targets_mean": 2921.2,
|
|
"valid_targets_min": 547
|
|
},
|
|
{
|
|
"epoch": 2.754360465116279,
|
|
"grad_norm": 0.5695113796330928,
|
|
"learning_rate": 3.040729290307231e-05,
|
|
"loss": 0.2767,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1445031762123108,
|
|
"step": 1895,
|
|
"valid_targets_mean": 3292.2,
|
|
"valid_targets_min": 446
|
|
},
|
|
{
|
|
"epoch": 2.761627906976744,
|
|
"grad_norm": 0.5380566024640052,
|
|
"learning_rate": 3.0345324713433454e-05,
|
|
"loss": 0.2717,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12390387058258057,
|
|
"step": 1900,
|
|
"valid_targets_mean": 2912.6,
|
|
"valid_targets_min": 467
|
|
},
|
|
{
|
|
"epoch": 2.7688953488372094,
|
|
"grad_norm": 0.5700404751058241,
|
|
"learning_rate": 3.0283220628133328e-05,
|
|
"loss": 0.2729,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17504948377609253,
|
|
"step": 1905,
|
|
"valid_targets_mean": 2833.1,
|
|
"valid_targets_min": 711
|
|
},
|
|
{
|
|
"epoch": 2.7761627906976747,
|
|
"grad_norm": 0.5501099285719143,
|
|
"learning_rate": 3.0220981462968038e-05,
|
|
"loss": 0.2735,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11852732300758362,
|
|
"step": 1910,
|
|
"valid_targets_mean": 2703.9,
|
|
"valid_targets_min": 653
|
|
},
|
|
{
|
|
"epoch": 2.7834302325581395,
|
|
"grad_norm": 0.5057554599317371,
|
|
"learning_rate": 3.0158608035508107e-05,
|
|
"loss": 0.2646,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13264814019203186,
|
|
"step": 1915,
|
|
"valid_targets_mean": 3944.9,
|
|
"valid_targets_min": 599
|
|
},
|
|
{
|
|
"epoch": 2.7906976744186047,
|
|
"grad_norm": 0.5250685596753014,
|
|
"learning_rate": 3.0096101165087715e-05,
|
|
"loss": 0.2628,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1443638652563095,
|
|
"step": 1920,
|
|
"valid_targets_mean": 3738.5,
|
|
"valid_targets_min": 729
|
|
},
|
|
{
|
|
"epoch": 2.7979651162790695,
|
|
"grad_norm": 0.47324933535416364,
|
|
"learning_rate": 3.0033461672793946e-05,
|
|
"loss": 0.2672,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.125032439827919,
|
|
"step": 1925,
|
|
"valid_targets_mean": 3828.5,
|
|
"valid_targets_min": 743
|
|
},
|
|
{
|
|
"epoch": 2.8052325581395348,
|
|
"grad_norm": 0.4955622085267105,
|
|
"learning_rate": 2.9970690381456e-05,
|
|
"loss": 0.2502,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1393406242132187,
|
|
"step": 1930,
|
|
"valid_targets_mean": 3930.9,
|
|
"valid_targets_min": 603
|
|
},
|
|
{
|
|
"epoch": 2.8125,
|
|
"grad_norm": 0.5130630695006796,
|
|
"learning_rate": 2.990778811563438e-05,
|
|
"loss": 0.2541,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12806552648544312,
|
|
"step": 1935,
|
|
"valid_targets_mean": 3769.0,
|
|
"valid_targets_min": 691
|
|
},
|
|
{
|
|
"epoch": 2.8197674418604652,
|
|
"grad_norm": 0.6055425321713648,
|
|
"learning_rate": 2.984475570161005e-05,
|
|
"loss": 0.2631,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17337648570537567,
|
|
"step": 1940,
|
|
"valid_targets_mean": 3236.2,
|
|
"valid_targets_min": 867
|
|
},
|
|
{
|
|
"epoch": 2.8270348837209305,
|
|
"grad_norm": 0.5284530228759448,
|
|
"learning_rate": 2.978159396737363e-05,
|
|
"loss": 0.2622,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1735924780368805,
|
|
"step": 1945,
|
|
"valid_targets_mean": 4311.1,
|
|
"valid_targets_min": 715
|
|
},
|
|
{
|
|
"epoch": 2.8343023255813953,
|
|
"grad_norm": 0.510598428920252,
|
|
"learning_rate": 2.9718303742614437e-05,
|
|
"loss": 0.2545,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15028700232505798,
|
|
"step": 1950,
|
|
"valid_targets_mean": 3324.8,
|
|
"valid_targets_min": 746
|
|
},
|
|
{
|
|
"epoch": 2.8415697674418605,
|
|
"grad_norm": 0.5268476903116217,
|
|
"learning_rate": 2.9654885858709678e-05,
|
|
"loss": 0.2585,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14516228437423706,
|
|
"step": 1955,
|
|
"valid_targets_mean": 3818.1,
|
|
"valid_targets_min": 646
|
|
},
|
|
{
|
|
"epoch": 2.8488372093023253,
|
|
"grad_norm": 0.6076295209820001,
|
|
"learning_rate": 2.9591341148713444e-05,
|
|
"loss": 0.2654,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16147010028362274,
|
|
"step": 1960,
|
|
"valid_targets_mean": 2661.6,
|
|
"valid_targets_min": 459
|
|
},
|
|
{
|
|
"epoch": 2.8561046511627906,
|
|
"grad_norm": 0.5399299301824988,
|
|
"learning_rate": 2.952767044734584e-05,
|
|
"loss": 0.269,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16280090808868408,
|
|
"step": 1965,
|
|
"valid_targets_mean": 3895.5,
|
|
"valid_targets_min": 953
|
|
},
|
|
{
|
|
"epoch": 2.863372093023256,
|
|
"grad_norm": 0.4600176373509559,
|
|
"learning_rate": 2.946387459098196e-05,
|
|
"loss": 0.2542,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1348821073770523,
|
|
"step": 1970,
|
|
"valid_targets_mean": 4237.5,
|
|
"valid_targets_min": 693
|
|
},
|
|
{
|
|
"epoch": 2.870639534883721,
|
|
"grad_norm": 0.48877197485140134,
|
|
"learning_rate": 2.9399954417640956e-05,
|
|
"loss": 0.265,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11835235357284546,
|
|
"step": 1975,
|
|
"valid_targets_mean": 3062.9,
|
|
"valid_targets_min": 736
|
|
},
|
|
{
|
|
"epoch": 2.8779069767441863,
|
|
"grad_norm": 0.5079540827052327,
|
|
"learning_rate": 2.9335910766974977e-05,
|
|
"loss": 0.2777,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13968515396118164,
|
|
"step": 1980,
|
|
"valid_targets_mean": 3577.6,
|
|
"valid_targets_min": 654
|
|
},
|
|
{
|
|
"epoch": 2.885174418604651,
|
|
"grad_norm": 0.4539764539432686,
|
|
"learning_rate": 2.9271744480258174e-05,
|
|
"loss": 0.2529,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1398291289806366,
|
|
"step": 1985,
|
|
"valid_targets_mean": 4915.9,
|
|
"valid_targets_min": 3623
|
|
},
|
|
{
|
|
"epoch": 2.8924418604651163,
|
|
"grad_norm": 0.49174216690290445,
|
|
"learning_rate": 2.9207456400375646e-05,
|
|
"loss": 0.2762,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12449312955141068,
|
|
"step": 1990,
|
|
"valid_targets_mean": 3380.0,
|
|
"valid_targets_min": 697
|
|
},
|
|
{
|
|
"epoch": 2.8997093023255816,
|
|
"grad_norm": 0.5689923342535651,
|
|
"learning_rate": 2.914304737181234e-05,
|
|
"loss": 0.2845,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14871911704540253,
|
|
"step": 1995,
|
|
"valid_targets_mean": 3037.6,
|
|
"valid_targets_min": 810
|
|
},
|
|
{
|
|
"epoch": 2.9069767441860463,
|
|
"grad_norm": 0.5300076144454899,
|
|
"learning_rate": 2.9078518240642e-05,
|
|
"loss": 0.2688,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14786851406097412,
|
|
"step": 2000,
|
|
"valid_targets_mean": 3872.2,
|
|
"valid_targets_min": 634
|
|
},
|
|
{
|
|
"epoch": 2.9142441860465116,
|
|
"grad_norm": 0.5110415901667488,
|
|
"learning_rate": 2.9013869854516028e-05,
|
|
"loss": 0.2543,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10360009968280792,
|
|
"step": 2005,
|
|
"valid_targets_mean": 2512.8,
|
|
"valid_targets_min": 567
|
|
},
|
|
{
|
|
"epoch": 2.921511627906977,
|
|
"grad_norm": 0.5373767986536778,
|
|
"learning_rate": 2.894910306265234e-05,
|
|
"loss": 0.2635,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12088128924369812,
|
|
"step": 2010,
|
|
"valid_targets_mean": 2757.8,
|
|
"valid_targets_min": 409
|
|
},
|
|
{
|
|
"epoch": 2.928779069767442,
|
|
"grad_norm": 0.4797863204246029,
|
|
"learning_rate": 2.888421871582423e-05,
|
|
"loss": 0.2726,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13703224062919617,
|
|
"step": 2015,
|
|
"valid_targets_mean": 3601.5,
|
|
"valid_targets_min": 718
|
|
},
|
|
{
|
|
"epoch": 2.936046511627907,
|
|
"grad_norm": 0.45472505465476615,
|
|
"learning_rate": 2.8819217666349198e-05,
|
|
"loss": 0.2622,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16491886973381042,
|
|
"step": 2020,
|
|
"valid_targets_mean": 5240.4,
|
|
"valid_targets_min": 696
|
|
},
|
|
{
|
|
"epoch": 2.943313953488372,
|
|
"grad_norm": 0.4669182737298547,
|
|
"learning_rate": 2.8754100768077743e-05,
|
|
"loss": 0.2525,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14050084352493286,
|
|
"step": 2025,
|
|
"valid_targets_mean": 4352.5,
|
|
"valid_targets_min": 556
|
|
},
|
|
{
|
|
"epoch": 2.9505813953488373,
|
|
"grad_norm": 0.4969448731159028,
|
|
"learning_rate": 2.8688868876382122e-05,
|
|
"loss": 0.2582,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18493834137916565,
|
|
"step": 2030,
|
|
"valid_targets_mean": 5092.4,
|
|
"valid_targets_min": 712
|
|
},
|
|
{
|
|
"epoch": 2.957848837209302,
|
|
"grad_norm": 0.5489219835086259,
|
|
"learning_rate": 2.862352284814518e-05,
|
|
"loss": 0.2594,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16094838082790375,
|
|
"step": 2035,
|
|
"valid_targets_mean": 3309.8,
|
|
"valid_targets_min": 594
|
|
},
|
|
{
|
|
"epoch": 2.9651162790697674,
|
|
"grad_norm": 0.5671735062946283,
|
|
"learning_rate": 2.855806354174901e-05,
|
|
"loss": 0.2699,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13544762134552002,
|
|
"step": 2040,
|
|
"valid_targets_mean": 2860.4,
|
|
"valid_targets_min": 727
|
|
},
|
|
{
|
|
"epoch": 2.9723837209302326,
|
|
"grad_norm": 0.43043332486830155,
|
|
"learning_rate": 2.8492491817063767e-05,
|
|
"loss": 0.2638,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12342862784862518,
|
|
"step": 2045,
|
|
"valid_targets_mean": 4274.9,
|
|
"valid_targets_min": 692
|
|
},
|
|
{
|
|
"epoch": 2.979651162790698,
|
|
"grad_norm": 0.4888778059104538,
|
|
"learning_rate": 2.8426808535436294e-05,
|
|
"loss": 0.254,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12098248302936554,
|
|
"step": 2050,
|
|
"valid_targets_mean": 3508.0,
|
|
"valid_targets_min": 736
|
|
},
|
|
{
|
|
"epoch": 2.9869186046511627,
|
|
"grad_norm": 0.4868623719386895,
|
|
"learning_rate": 2.8361014559678856e-05,
|
|
"loss": 0.2592,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12850888073444366,
|
|
"step": 2055,
|
|
"valid_targets_mean": 3452.1,
|
|
"valid_targets_min": 532
|
|
},
|
|
{
|
|
"epoch": 2.994186046511628,
|
|
"grad_norm": 0.543954289354496,
|
|
"learning_rate": 2.8295110754057776e-05,
|
|
"loss": 0.2552,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11905788630247116,
|
|
"step": 2060,
|
|
"valid_targets_mean": 2484.2,
|
|
"valid_targets_min": 753
|
|
},
|
|
{
|
|
"epoch": 3.001453488372093,
|
|
"grad_norm": 0.46396982089080563,
|
|
"learning_rate": 2.822909798428211e-05,
|
|
"loss": 0.2498,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11284950375556946,
|
|
"step": 2065,
|
|
"valid_targets_mean": 3787.8,
|
|
"valid_targets_min": 832
|
|
},
|
|
{
|
|
"epoch": 3.008720930232558,
|
|
"grad_norm": 0.5132727999413913,
|
|
"learning_rate": 2.8162977117492257e-05,
|
|
"loss": 0.2634,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12710949778556824,
|
|
"step": 2070,
|
|
"valid_targets_mean": 3843.4,
|
|
"valid_targets_min": 753
|
|
},
|
|
{
|
|
"epoch": 3.015988372093023,
|
|
"grad_norm": 0.5336380637710425,
|
|
"learning_rate": 2.809674902224857e-05,
|
|
"loss": 0.2532,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1240164041519165,
|
|
"step": 2075,
|
|
"valid_targets_mean": 3290.1,
|
|
"valid_targets_min": 748
|
|
},
|
|
{
|
|
"epoch": 3.0232558139534884,
|
|
"grad_norm": 0.46893864837995336,
|
|
"learning_rate": 2.8030414568519963e-05,
|
|
"loss": 0.2547,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13958200812339783,
|
|
"step": 2080,
|
|
"valid_targets_mean": 4292.2,
|
|
"valid_targets_min": 855
|
|
},
|
|
{
|
|
"epoch": 3.0305232558139537,
|
|
"grad_norm": 0.4471657539573157,
|
|
"learning_rate": 2.796397462767245e-05,
|
|
"loss": 0.2467,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1111362874507904,
|
|
"step": 2085,
|
|
"valid_targets_mean": 5043.8,
|
|
"valid_targets_min": 3454
|
|
},
|
|
{
|
|
"epoch": 3.0377906976744184,
|
|
"grad_norm": 0.5752757770371824,
|
|
"learning_rate": 2.7897430072457733e-05,
|
|
"loss": 0.2504,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12422748655080795,
|
|
"step": 2090,
|
|
"valid_targets_mean": 3479.4,
|
|
"valid_targets_min": 599
|
|
},
|
|
{
|
|
"epoch": 3.0450581395348837,
|
|
"grad_norm": 0.506386742480055,
|
|
"learning_rate": 2.7830781777001706e-05,
|
|
"loss": 0.2642,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.099161796271801,
|
|
"step": 2095,
|
|
"valid_targets_mean": 3415.2,
|
|
"valid_targets_min": 483
|
|
},
|
|
{
|
|
"epoch": 3.052325581395349,
|
|
"grad_norm": 0.5905823245995147,
|
|
"learning_rate": 2.7764030616793017e-05,
|
|
"loss": 0.2567,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13965487480163574,
|
|
"step": 2100,
|
|
"valid_targets_mean": 2516.0,
|
|
"valid_targets_min": 528
|
|
},
|
|
{
|
|
"epoch": 3.059593023255814,
|
|
"grad_norm": 0.5387909462740589,
|
|
"learning_rate": 2.7697177468671516e-05,
|
|
"loss": 0.2604,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1169048324227333,
|
|
"step": 2105,
|
|
"valid_targets_mean": 3728.0,
|
|
"valid_targets_min": 552
|
|
},
|
|
{
|
|
"epoch": 3.066860465116279,
|
|
"grad_norm": 0.5149001542580065,
|
|
"learning_rate": 2.7630223210816765e-05,
|
|
"loss": 0.2604,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11615493893623352,
|
|
"step": 2110,
|
|
"valid_targets_mean": 3848.2,
|
|
"valid_targets_min": 737
|
|
},
|
|
{
|
|
"epoch": 3.074127906976744,
|
|
"grad_norm": 0.4829088029098308,
|
|
"learning_rate": 2.7563168722736517e-05,
|
|
"loss": 0.2624,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11458876729011536,
|
|
"step": 2115,
|
|
"valid_targets_mean": 4425.9,
|
|
"valid_targets_min": 587
|
|
},
|
|
{
|
|
"epoch": 3.0813953488372094,
|
|
"grad_norm": 0.6073559587335657,
|
|
"learning_rate": 2.749601488525512e-05,
|
|
"loss": 0.2511,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13436372578144073,
|
|
"step": 2120,
|
|
"valid_targets_mean": 3094.0,
|
|
"valid_targets_min": 509
|
|
},
|
|
{
|
|
"epoch": 3.0886627906976742,
|
|
"grad_norm": 0.49969662117819635,
|
|
"learning_rate": 2.7428762580501982e-05,
|
|
"loss": 0.2506,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14222140610218048,
|
|
"step": 2125,
|
|
"valid_targets_mean": 4020.0,
|
|
"valid_targets_min": 907
|
|
},
|
|
{
|
|
"epoch": 3.0959302325581395,
|
|
"grad_norm": 0.5204880529542931,
|
|
"learning_rate": 2.7361412691899972e-05,
|
|
"loss": 0.2561,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10934726893901825,
|
|
"step": 2130,
|
|
"valid_targets_mean": 3369.4,
|
|
"valid_targets_min": 774
|
|
},
|
|
{
|
|
"epoch": 3.1031976744186047,
|
|
"grad_norm": 0.5592250434484849,
|
|
"learning_rate": 2.7293966104153814e-05,
|
|
"loss": 0.2423,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0901477187871933,
|
|
"step": 2135,
|
|
"valid_targets_mean": 2053.5,
|
|
"valid_targets_min": 597
|
|
},
|
|
{
|
|
"epoch": 3.11046511627907,
|
|
"grad_norm": 0.5152668405523907,
|
|
"learning_rate": 2.722642370323847e-05,
|
|
"loss": 0.2495,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11756094545125961,
|
|
"step": 2140,
|
|
"valid_targets_mean": 3801.4,
|
|
"valid_targets_min": 741
|
|
},
|
|
{
|
|
"epoch": 3.1177325581395348,
|
|
"grad_norm": 0.5272762330048814,
|
|
"learning_rate": 2.7158786376387486e-05,
|
|
"loss": 0.2492,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13304001092910767,
|
|
"step": 2145,
|
|
"valid_targets_mean": 3903.8,
|
|
"valid_targets_min": 3133
|
|
},
|
|
{
|
|
"epoch": 3.125,
|
|
"grad_norm": 0.6150488499289717,
|
|
"learning_rate": 2.7091055012081376e-05,
|
|
"loss": 0.2423,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12594833970069885,
|
|
"step": 2150,
|
|
"valid_targets_mean": 2698.0,
|
|
"valid_targets_min": 609
|
|
},
|
|
{
|
|
"epoch": 3.1322674418604652,
|
|
"grad_norm": 0.4675225384238192,
|
|
"learning_rate": 2.7023230500035896e-05,
|
|
"loss": 0.2499,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12618444859981537,
|
|
"step": 2155,
|
|
"valid_targets_mean": 4309.4,
|
|
"valid_targets_min": 677
|
|
},
|
|
{
|
|
"epoch": 3.13953488372093,
|
|
"grad_norm": 0.6332751429296548,
|
|
"learning_rate": 2.6955313731190412e-05,
|
|
"loss": 0.2605,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1332174837589264,
|
|
"step": 2160,
|
|
"valid_targets_mean": 2770.2,
|
|
"valid_targets_min": 622
|
|
},
|
|
{
|
|
"epoch": 3.1468023255813953,
|
|
"grad_norm": 0.8559144896636022,
|
|
"learning_rate": 2.688730559769615e-05,
|
|
"loss": 0.2523,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12001748383045197,
|
|
"step": 2165,
|
|
"valid_targets_mean": 4595.1,
|
|
"valid_targets_min": 600
|
|
},
|
|
{
|
|
"epoch": 3.1540697674418605,
|
|
"grad_norm": 0.5931117865157438,
|
|
"learning_rate": 2.6819206992904508e-05,
|
|
"loss": 0.2504,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14907360076904297,
|
|
"step": 2170,
|
|
"valid_targets_mean": 2909.9,
|
|
"valid_targets_min": 387
|
|
},
|
|
{
|
|
"epoch": 3.1613372093023258,
|
|
"grad_norm": 0.5490654340936475,
|
|
"learning_rate": 2.6751018811355307e-05,
|
|
"loss": 0.2463,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10953619331121445,
|
|
"step": 2175,
|
|
"valid_targets_mean": 2857.0,
|
|
"valid_targets_min": 778
|
|
},
|
|
{
|
|
"epoch": 3.1686046511627906,
|
|
"grad_norm": 0.5199051841020532,
|
|
"learning_rate": 2.6682741948765047e-05,
|
|
"loss": 0.2454,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13250568509101868,
|
|
"step": 2180,
|
|
"valid_targets_mean": 3317.5,
|
|
"valid_targets_min": 702
|
|
},
|
|
{
|
|
"epoch": 3.175872093023256,
|
|
"grad_norm": 0.48877762491217913,
|
|
"learning_rate": 2.661437730201514e-05,
|
|
"loss": 0.2548,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1184430867433548,
|
|
"step": 2185,
|
|
"valid_targets_mean": 3868.5,
|
|
"valid_targets_min": 527
|
|
},
|
|
{
|
|
"epoch": 3.183139534883721,
|
|
"grad_norm": 0.5413434386944661,
|
|
"learning_rate": 2.654592576914011e-05,
|
|
"loss": 0.2451,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11572098731994629,
|
|
"step": 2190,
|
|
"valid_targets_mean": 2643.5,
|
|
"valid_targets_min": 840
|
|
},
|
|
{
|
|
"epoch": 3.1904069767441863,
|
|
"grad_norm": 0.4826257777252111,
|
|
"learning_rate": 2.6477388249315836e-05,
|
|
"loss": 0.2446,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11999189108610153,
|
|
"step": 2195,
|
|
"valid_targets_mean": 4661.1,
|
|
"valid_targets_min": 700
|
|
},
|
|
{
|
|
"epoch": 3.197674418604651,
|
|
"grad_norm": 0.532187618449715,
|
|
"learning_rate": 2.6408765642847698e-05,
|
|
"loss": 0.2558,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1451462358236313,
|
|
"step": 2200,
|
|
"valid_targets_mean": 3591.5,
|
|
"valid_targets_min": 612
|
|
},
|
|
{
|
|
"epoch": 3.2049418604651163,
|
|
"grad_norm": 0.49122871352752695,
|
|
"learning_rate": 2.6340058851158788e-05,
|
|
"loss": 0.2538,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12171737849712372,
|
|
"step": 2205,
|
|
"valid_targets_mean": 3890.9,
|
|
"valid_targets_min": 925
|
|
},
|
|
{
|
|
"epoch": 3.2122093023255816,
|
|
"grad_norm": 0.48972445158403766,
|
|
"learning_rate": 2.6271268776778032e-05,
|
|
"loss": 0.2412,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13735152781009674,
|
|
"step": 2210,
|
|
"valid_targets_mean": 4153.9,
|
|
"valid_targets_min": 753
|
|
},
|
|
{
|
|
"epoch": 3.2194767441860463,
|
|
"grad_norm": 0.46822601101112704,
|
|
"learning_rate": 2.6202396323328357e-05,
|
|
"loss": 0.2435,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1055523157119751,
|
|
"step": 2215,
|
|
"valid_targets_mean": 3463.5,
|
|
"valid_targets_min": 497
|
|
},
|
|
{
|
|
"epoch": 3.2267441860465116,
|
|
"grad_norm": 0.5416109151148425,
|
|
"learning_rate": 2.6133442395514833e-05,
|
|
"loss": 0.2612,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1550188809633255,
|
|
"step": 2220,
|
|
"valid_targets_mean": 3869.2,
|
|
"valid_targets_min": 313
|
|
},
|
|
{
|
|
"epoch": 3.234011627906977,
|
|
"grad_norm": 0.4642704975191872,
|
|
"learning_rate": 2.606440789911276e-05,
|
|
"loss": 0.2476,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10453011095523834,
|
|
"step": 2225,
|
|
"valid_targets_mean": 3596.6,
|
|
"valid_targets_min": 605
|
|
},
|
|
{
|
|
"epoch": 3.241279069767442,
|
|
"grad_norm": 0.4661250426831108,
|
|
"learning_rate": 2.599529374095578e-05,
|
|
"loss": 0.2508,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.135253444314003,
|
|
"step": 2230,
|
|
"valid_targets_mean": 4895.1,
|
|
"valid_targets_min": 684
|
|
},
|
|
{
|
|
"epoch": 3.248546511627907,
|
|
"grad_norm": 0.5039451072942192,
|
|
"learning_rate": 2.5926100828923985e-05,
|
|
"loss": 0.2435,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12384626269340515,
|
|
"step": 2235,
|
|
"valid_targets_mean": 4168.6,
|
|
"valid_targets_min": 805
|
|
},
|
|
{
|
|
"epoch": 3.255813953488372,
|
|
"grad_norm": 0.46502877427362305,
|
|
"learning_rate": 2.5856830071931944e-05,
|
|
"loss": 0.2583,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11560146510601044,
|
|
"step": 2240,
|
|
"valid_targets_mean": 4750.0,
|
|
"valid_targets_min": 4164
|
|
},
|
|
{
|
|
"epoch": 3.2630813953488373,
|
|
"grad_norm": 0.5425286991972637,
|
|
"learning_rate": 2.578748237991682e-05,
|
|
"loss": 0.2588,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13858449459075928,
|
|
"step": 2245,
|
|
"valid_targets_mean": 3679.4,
|
|
"valid_targets_min": 850
|
|
},
|
|
{
|
|
"epoch": 3.270348837209302,
|
|
"grad_norm": 0.5496468651661625,
|
|
"learning_rate": 2.571805866382638e-05,
|
|
"loss": 0.2553,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.108754001557827,
|
|
"step": 2250,
|
|
"valid_targets_mean": 3159.8,
|
|
"valid_targets_min": 818
|
|
},
|
|
{
|
|
"epoch": 3.2776162790697674,
|
|
"grad_norm": 0.4963269407533553,
|
|
"learning_rate": 2.5648559835607047e-05,
|
|
"loss": 0.245,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1490362286567688,
|
|
"step": 2255,
|
|
"valid_targets_mean": 4346.9,
|
|
"valid_targets_min": 560
|
|
},
|
|
{
|
|
"epoch": 3.2848837209302326,
|
|
"grad_norm": 0.5040364962140519,
|
|
"learning_rate": 2.5578986808191904e-05,
|
|
"loss": 0.2502,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13290151953697205,
|
|
"step": 2260,
|
|
"valid_targets_mean": 4253.6,
|
|
"valid_targets_min": 882
|
|
},
|
|
{
|
|
"epoch": 3.292151162790698,
|
|
"grad_norm": 0.517643889938687,
|
|
"learning_rate": 2.5509340495488707e-05,
|
|
"loss": 0.2443,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.18137292563915253,
|
|
"step": 2265,
|
|
"valid_targets_mean": 4854.5,
|
|
"valid_targets_min": 4012
|
|
},
|
|
{
|
|
"epoch": 3.2994186046511627,
|
|
"grad_norm": 0.5599724940409381,
|
|
"learning_rate": 2.5439621812367907e-05,
|
|
"loss": 0.2558,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09955041110515594,
|
|
"step": 2270,
|
|
"valid_targets_mean": 2542.8,
|
|
"valid_targets_min": 471
|
|
},
|
|
{
|
|
"epoch": 3.306686046511628,
|
|
"grad_norm": 0.42419128765888825,
|
|
"learning_rate": 2.5369831674650572e-05,
|
|
"loss": 0.2504,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12508805096149445,
|
|
"step": 2275,
|
|
"valid_targets_mean": 5078.4,
|
|
"valid_targets_min": 714
|
|
},
|
|
{
|
|
"epoch": 3.313953488372093,
|
|
"grad_norm": 0.524949050763777,
|
|
"learning_rate": 2.529997099909643e-05,
|
|
"loss": 0.2542,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14017917215824127,
|
|
"step": 2280,
|
|
"valid_targets_mean": 3980.0,
|
|
"valid_targets_min": 867
|
|
},
|
|
{
|
|
"epoch": 3.321220930232558,
|
|
"grad_norm": 0.44629089394261284,
|
|
"learning_rate": 2.5230040703391775e-05,
|
|
"loss": 0.2394,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09534334391355515,
|
|
"step": 2285,
|
|
"valid_targets_mean": 4047.8,
|
|
"valid_targets_min": 3198
|
|
},
|
|
{
|
|
"epoch": 3.328488372093023,
|
|
"grad_norm": 0.5471725041255697,
|
|
"learning_rate": 2.5160041706137424e-05,
|
|
"loss": 0.2497,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13267022371292114,
|
|
"step": 2290,
|
|
"valid_targets_mean": 4100.4,
|
|
"valid_targets_min": 988
|
|
},
|
|
{
|
|
"epoch": 3.3357558139534884,
|
|
"grad_norm": 0.47706431071080707,
|
|
"learning_rate": 2.508997492683666e-05,
|
|
"loss": 0.2372,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1036720871925354,
|
|
"step": 2295,
|
|
"valid_targets_mean": 3625.9,
|
|
"valid_targets_min": 766
|
|
},
|
|
{
|
|
"epoch": 3.3430232558139537,
|
|
"grad_norm": 0.46979061384683135,
|
|
"learning_rate": 2.5019841285883143e-05,
|
|
"loss": 0.2378,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14231424033641815,
|
|
"step": 2300,
|
|
"valid_targets_mean": 4415.0,
|
|
"valid_targets_min": 746
|
|
},
|
|
{
|
|
"epoch": 3.3502906976744184,
|
|
"grad_norm": 0.46840855749044336,
|
|
"learning_rate": 2.4949641704548834e-05,
|
|
"loss": 0.2378,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10291890799999237,
|
|
"step": 2305,
|
|
"valid_targets_mean": 3752.5,
|
|
"valid_targets_min": 594
|
|
},
|
|
{
|
|
"epoch": 3.3575581395348837,
|
|
"grad_norm": 0.4787805064264873,
|
|
"learning_rate": 2.4879377104971863e-05,
|
|
"loss": 0.2462,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11151669174432755,
|
|
"step": 2310,
|
|
"valid_targets_mean": 4007.1,
|
|
"valid_targets_min": 570
|
|
},
|
|
{
|
|
"epoch": 3.364825581395349,
|
|
"grad_norm": 0.5134464582083824,
|
|
"learning_rate": 2.4809048410144467e-05,
|
|
"loss": 0.2461,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.136276975274086,
|
|
"step": 2315,
|
|
"valid_targets_mean": 3642.0,
|
|
"valid_targets_min": 671
|
|
},
|
|
{
|
|
"epoch": 3.3720930232558137,
|
|
"grad_norm": 0.4545347794500175,
|
|
"learning_rate": 2.4738656543900808e-05,
|
|
"loss": 0.2436,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10940147936344147,
|
|
"step": 2320,
|
|
"valid_targets_mean": 3730.6,
|
|
"valid_targets_min": 953
|
|
},
|
|
{
|
|
"epoch": 3.379360465116279,
|
|
"grad_norm": 0.46413507712775337,
|
|
"learning_rate": 2.4668202430904872e-05,
|
|
"loss": 0.2469,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12754136323928833,
|
|
"step": 2325,
|
|
"valid_targets_mean": 4426.5,
|
|
"valid_targets_min": 1194
|
|
},
|
|
{
|
|
"epoch": 3.386627906976744,
|
|
"grad_norm": 0.49443156483084405,
|
|
"learning_rate": 2.4597686996638334e-05,
|
|
"loss": 0.2584,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11726079881191254,
|
|
"step": 2330,
|
|
"valid_targets_mean": 3938.8,
|
|
"valid_targets_min": 800
|
|
},
|
|
{
|
|
"epoch": 3.3938953488372094,
|
|
"grad_norm": 0.4885507906087015,
|
|
"learning_rate": 2.452711116738834e-05,
|
|
"loss": 0.2442,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10095968097448349,
|
|
"step": 2335,
|
|
"valid_targets_mean": 3261.5,
|
|
"valid_targets_min": 626
|
|
},
|
|
{
|
|
"epoch": 3.4011627906976742,
|
|
"grad_norm": 0.5343896962809889,
|
|
"learning_rate": 2.4456475870235433e-05,
|
|
"loss": 0.2468,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16157086193561554,
|
|
"step": 2340,
|
|
"valid_targets_mean": 3889.4,
|
|
"valid_targets_min": 796
|
|
},
|
|
{
|
|
"epoch": 3.4084302325581395,
|
|
"grad_norm": 0.4808257217663416,
|
|
"learning_rate": 2.4385782033041282e-05,
|
|
"loss": 0.2333,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09912088513374329,
|
|
"step": 2345,
|
|
"valid_targets_mean": 3184.6,
|
|
"valid_targets_min": 726
|
|
},
|
|
{
|
|
"epoch": 3.4156976744186047,
|
|
"grad_norm": 0.48604724440506825,
|
|
"learning_rate": 2.431503058443655e-05,
|
|
"loss": 0.2453,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11162015795707703,
|
|
"step": 2350,
|
|
"valid_targets_mean": 3422.1,
|
|
"valid_targets_min": 667
|
|
},
|
|
{
|
|
"epoch": 3.4229651162790695,
|
|
"grad_norm": 0.4864948711793094,
|
|
"learning_rate": 2.4244222453808694e-05,
|
|
"loss": 0.2571,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1151517927646637,
|
|
"step": 2355,
|
|
"valid_targets_mean": 4209.6,
|
|
"valid_targets_min": 857
|
|
},
|
|
{
|
|
"epoch": 3.4302325581395348,
|
|
"grad_norm": 0.5073998403953838,
|
|
"learning_rate": 2.4173358571289716e-05,
|
|
"loss": 0.2532,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16314566135406494,
|
|
"step": 2360,
|
|
"valid_targets_mean": 4723.2,
|
|
"valid_targets_min": 810
|
|
},
|
|
{
|
|
"epoch": 3.4375,
|
|
"grad_norm": 0.543424876760199,
|
|
"learning_rate": 2.4102439867743995e-05,
|
|
"loss": 0.2477,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09115774184465408,
|
|
"step": 2365,
|
|
"valid_targets_mean": 2121.8,
|
|
"valid_targets_min": 586
|
|
},
|
|
{
|
|
"epoch": 3.4447674418604652,
|
|
"grad_norm": 0.43803750016335147,
|
|
"learning_rate": 2.4031467274756026e-05,
|
|
"loss": 0.2402,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13034743070602417,
|
|
"step": 2370,
|
|
"valid_targets_mean": 4575.1,
|
|
"valid_targets_min": 1213
|
|
},
|
|
{
|
|
"epoch": 3.4520348837209305,
|
|
"grad_norm": 1.022884642404884,
|
|
"learning_rate": 2.3960441724618195e-05,
|
|
"loss": 0.2536,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10168780386447906,
|
|
"step": 2375,
|
|
"valid_targets_mean": 3031.5,
|
|
"valid_targets_min": 627
|
|
},
|
|
{
|
|
"epoch": 3.4593023255813953,
|
|
"grad_norm": 0.47224341467442843,
|
|
"learning_rate": 2.3889364150318523e-05,
|
|
"loss": 0.2593,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11175704002380371,
|
|
"step": 2380,
|
|
"valid_targets_mean": 4139.5,
|
|
"valid_targets_min": 790
|
|
},
|
|
{
|
|
"epoch": 3.4665697674418605,
|
|
"grad_norm": 0.5537350873058593,
|
|
"learning_rate": 2.3818235485528438e-05,
|
|
"loss": 0.2612,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09244590997695923,
|
|
"step": 2385,
|
|
"valid_targets_mean": 2139.6,
|
|
"valid_targets_min": 626
|
|
},
|
|
{
|
|
"epoch": 3.4738372093023258,
|
|
"grad_norm": 0.48412371898831763,
|
|
"learning_rate": 2.374705666459046e-05,
|
|
"loss": 0.2562,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11267127841711044,
|
|
"step": 2390,
|
|
"valid_targets_mean": 3562.9,
|
|
"valid_targets_min": 693
|
|
},
|
|
{
|
|
"epoch": 3.4811046511627906,
|
|
"grad_norm": 0.5112459040365906,
|
|
"learning_rate": 2.367582862250599e-05,
|
|
"loss": 0.2451,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11210276186466217,
|
|
"step": 2395,
|
|
"valid_targets_mean": 3276.8,
|
|
"valid_targets_min": 591
|
|
},
|
|
{
|
|
"epoch": 3.488372093023256,
|
|
"grad_norm": 0.4904007106936307,
|
|
"learning_rate": 2.3604552294922974e-05,
|
|
"loss": 0.2473,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12592178583145142,
|
|
"step": 2400,
|
|
"valid_targets_mean": 4156.2,
|
|
"valid_targets_min": 805
|
|
},
|
|
{
|
|
"epoch": 3.495639534883721,
|
|
"grad_norm": 0.5533230425308654,
|
|
"learning_rate": 2.353322861812364e-05,
|
|
"loss": 0.2542,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10514762997627258,
|
|
"step": 2405,
|
|
"valid_targets_mean": 2583.9,
|
|
"valid_targets_min": 246
|
|
},
|
|
{
|
|
"epoch": 3.5029069767441863,
|
|
"grad_norm": 0.4769266460610174,
|
|
"learning_rate": 2.346185852901219e-05,
|
|
"loss": 0.2423,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10916031897068024,
|
|
"step": 2410,
|
|
"valid_targets_mean": 3479.1,
|
|
"valid_targets_min": 807
|
|
},
|
|
{
|
|
"epoch": 3.510174418604651,
|
|
"grad_norm": 0.4891779772353748,
|
|
"learning_rate": 2.3390442965102503e-05,
|
|
"loss": 0.2449,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1259600967168808,
|
|
"step": 2415,
|
|
"valid_targets_mean": 3885.2,
|
|
"valid_targets_min": 650
|
|
},
|
|
{
|
|
"epoch": 3.5174418604651163,
|
|
"grad_norm": 0.45544094475272356,
|
|
"learning_rate": 2.3318982864505806e-05,
|
|
"loss": 0.2572,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11584748327732086,
|
|
"step": 2420,
|
|
"valid_targets_mean": 4185.8,
|
|
"valid_targets_min": 480
|
|
},
|
|
{
|
|
"epoch": 3.5247093023255816,
|
|
"grad_norm": 0.4766624640907669,
|
|
"learning_rate": 2.324747916591836e-05,
|
|
"loss": 0.252,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13836249709129333,
|
|
"step": 2425,
|
|
"valid_targets_mean": 4399.9,
|
|
"valid_targets_min": 1044
|
|
},
|
|
{
|
|
"epoch": 3.5319767441860463,
|
|
"grad_norm": 0.4650029600411716,
|
|
"learning_rate": 2.317593280860913e-05,
|
|
"loss": 0.2333,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12125978618860245,
|
|
"step": 2430,
|
|
"valid_targets_mean": 4253.5,
|
|
"valid_targets_min": 635
|
|
},
|
|
{
|
|
"epoch": 3.5392441860465116,
|
|
"grad_norm": 0.5028829055009032,
|
|
"learning_rate": 2.3104344732407436e-05,
|
|
"loss": 0.2545,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11511494219303131,
|
|
"step": 2435,
|
|
"valid_targets_mean": 3393.1,
|
|
"valid_targets_min": 986
|
|
},
|
|
{
|
|
"epoch": 3.546511627906977,
|
|
"grad_norm": 0.5174631620772431,
|
|
"learning_rate": 2.3032715877690622e-05,
|
|
"loss": 0.2392,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1459505259990692,
|
|
"step": 2440,
|
|
"valid_targets_mean": 4194.1,
|
|
"valid_targets_min": 750
|
|
},
|
|
{
|
|
"epoch": 3.553779069767442,
|
|
"grad_norm": 0.46778152593245964,
|
|
"learning_rate": 2.296104718537169e-05,
|
|
"loss": 0.2527,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16303589940071106,
|
|
"step": 2445,
|
|
"valid_targets_mean": 5621.5,
|
|
"valid_targets_min": 516
|
|
},
|
|
{
|
|
"epoch": 3.561046511627907,
|
|
"grad_norm": 0.5035401466652747,
|
|
"learning_rate": 2.2889339596886958e-05,
|
|
"loss": 0.2504,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12182118743658066,
|
|
"step": 2450,
|
|
"valid_targets_mean": 4179.8,
|
|
"valid_targets_min": 711
|
|
},
|
|
{
|
|
"epoch": 3.568313953488372,
|
|
"grad_norm": 0.4949500654402859,
|
|
"learning_rate": 2.2817594054183675e-05,
|
|
"loss": 0.2423,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12568366527557373,
|
|
"step": 2455,
|
|
"valid_targets_mean": 4049.9,
|
|
"valid_targets_min": 792
|
|
},
|
|
{
|
|
"epoch": 3.5755813953488373,
|
|
"grad_norm": 0.44379194690985047,
|
|
"learning_rate": 2.2745811499707645e-05,
|
|
"loss": 0.2575,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10165221989154816,
|
|
"step": 2460,
|
|
"valid_targets_mean": 3895.0,
|
|
"valid_targets_min": 702
|
|
},
|
|
{
|
|
"epoch": 3.582848837209302,
|
|
"grad_norm": 0.4609499146509756,
|
|
"learning_rate": 2.267399287639088e-05,
|
|
"loss": 0.2395,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13126936554908752,
|
|
"step": 2465,
|
|
"valid_targets_mean": 4307.1,
|
|
"valid_targets_min": 805
|
|
},
|
|
{
|
|
"epoch": 3.5901162790697674,
|
|
"grad_norm": 0.4231243658860352,
|
|
"learning_rate": 2.260213912763917e-05,
|
|
"loss": 0.2458,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1243281364440918,
|
|
"step": 2470,
|
|
"valid_targets_mean": 4944.2,
|
|
"valid_targets_min": 2949
|
|
},
|
|
{
|
|
"epoch": 3.5973837209302326,
|
|
"grad_norm": 0.47982014413778806,
|
|
"learning_rate": 2.2530251197319723e-05,
|
|
"loss": 0.2409,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.108958899974823,
|
|
"step": 2475,
|
|
"valid_targets_mean": 3449.6,
|
|
"valid_targets_min": 493
|
|
},
|
|
{
|
|
"epoch": 3.604651162790698,
|
|
"grad_norm": 0.45227044431491636,
|
|
"learning_rate": 2.2458330029748736e-05,
|
|
"loss": 0.2439,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14309027791023254,
|
|
"step": 2480,
|
|
"valid_targets_mean": 4818.6,
|
|
"valid_targets_min": 3806
|
|
},
|
|
{
|
|
"epoch": 3.6119186046511627,
|
|
"grad_norm": 0.5649909883102694,
|
|
"learning_rate": 2.2386376569679036e-05,
|
|
"loss": 0.2604,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.173073410987854,
|
|
"step": 2485,
|
|
"valid_targets_mean": 4637.1,
|
|
"valid_targets_min": 3900
|
|
},
|
|
{
|
|
"epoch": 3.619186046511628,
|
|
"grad_norm": 0.47610124778582524,
|
|
"learning_rate": 2.231439176228763e-05,
|
|
"loss": 0.2457,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1240810751914978,
|
|
"step": 2490,
|
|
"valid_targets_mean": 3676.1,
|
|
"valid_targets_min": 595
|
|
},
|
|
{
|
|
"epoch": 3.626453488372093,
|
|
"grad_norm": 0.46700625613611785,
|
|
"learning_rate": 2.2242376553163286e-05,
|
|
"loss": 0.2473,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14469364285469055,
|
|
"step": 2495,
|
|
"valid_targets_mean": 4407.5,
|
|
"valid_targets_min": 620
|
|
},
|
|
{
|
|
"epoch": 3.633720930232558,
|
|
"grad_norm": 0.4756222601783613,
|
|
"learning_rate": 2.217033188829416e-05,
|
|
"loss": 0.2541,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1307680308818817,
|
|
"step": 2500,
|
|
"valid_targets_mean": 4861.6,
|
|
"valid_targets_min": 640
|
|
},
|
|
{
|
|
"epoch": 3.640988372093023,
|
|
"grad_norm": 0.5348602172378426,
|
|
"learning_rate": 2.2098258714055303e-05,
|
|
"loss": 0.2523,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16622218489646912,
|
|
"step": 2505,
|
|
"valid_targets_mean": 3662.9,
|
|
"valid_targets_min": 744
|
|
},
|
|
{
|
|
"epoch": 3.6482558139534884,
|
|
"grad_norm": 0.493726960795882,
|
|
"learning_rate": 2.20261579771963e-05,
|
|
"loss": 0.2436,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13390150666236877,
|
|
"step": 2510,
|
|
"valid_targets_mean": 3553.0,
|
|
"valid_targets_min": 556
|
|
},
|
|
{
|
|
"epoch": 3.6555232558139537,
|
|
"grad_norm": 0.48859839931015386,
|
|
"learning_rate": 2.1954030624828757e-05,
|
|
"loss": 0.2532,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14289015531539917,
|
|
"step": 2515,
|
|
"valid_targets_mean": 4269.1,
|
|
"valid_targets_min": 690
|
|
},
|
|
{
|
|
"epoch": 3.6627906976744184,
|
|
"grad_norm": 0.46297329620447086,
|
|
"learning_rate": 2.1881877604413927e-05,
|
|
"loss": 0.2406,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1050468236207962,
|
|
"step": 2520,
|
|
"valid_targets_mean": 3698.4,
|
|
"valid_targets_min": 760
|
|
},
|
|
{
|
|
"epoch": 3.6700581395348837,
|
|
"grad_norm": 0.5273537998892968,
|
|
"learning_rate": 2.1809699863750236e-05,
|
|
"loss": 0.2497,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14382243156433105,
|
|
"step": 2525,
|
|
"valid_targets_mean": 3749.8,
|
|
"valid_targets_min": 626
|
|
},
|
|
{
|
|
"epoch": 3.677325581395349,
|
|
"grad_norm": 0.4888083234986187,
|
|
"learning_rate": 2.1737498350960825e-05,
|
|
"loss": 0.2353,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12603764235973358,
|
|
"step": 2530,
|
|
"valid_targets_mean": 3474.1,
|
|
"valid_targets_min": 532
|
|
},
|
|
{
|
|
"epoch": 3.6845930232558137,
|
|
"grad_norm": 0.5194974843269244,
|
|
"learning_rate": 2.1665274014481112e-05,
|
|
"loss": 0.2528,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13663990795612335,
|
|
"step": 2535,
|
|
"valid_targets_mean": 3533.2,
|
|
"valid_targets_min": 661
|
|
},
|
|
{
|
|
"epoch": 3.691860465116279,
|
|
"grad_norm": 0.48415859865118777,
|
|
"learning_rate": 2.159302780304631e-05,
|
|
"loss": 0.2494,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14904913306236267,
|
|
"step": 2540,
|
|
"valid_targets_mean": 5181.0,
|
|
"valid_targets_min": 3993
|
|
},
|
|
{
|
|
"epoch": 3.699127906976744,
|
|
"grad_norm": 0.5174902951602472,
|
|
"learning_rate": 2.152076066567901e-05,
|
|
"loss": 0.2538,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09818239510059357,
|
|
"step": 2545,
|
|
"valid_targets_mean": 3285.4,
|
|
"valid_targets_min": 477
|
|
},
|
|
{
|
|
"epoch": 3.7063953488372094,
|
|
"grad_norm": 0.45632633047088905,
|
|
"learning_rate": 2.1448473551676644e-05,
|
|
"loss": 0.2427,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12770359218120575,
|
|
"step": 2550,
|
|
"valid_targets_mean": 3832.9,
|
|
"valid_targets_min": 584
|
|
},
|
|
{
|
|
"epoch": 3.7136627906976747,
|
|
"grad_norm": 0.49662233543481427,
|
|
"learning_rate": 2.13761674105991e-05,
|
|
"loss": 0.2523,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14436696469783783,
|
|
"step": 2555,
|
|
"valid_targets_mean": 4149.1,
|
|
"valid_targets_min": 544
|
|
},
|
|
{
|
|
"epoch": 3.7209302325581395,
|
|
"grad_norm": 0.5614542258504909,
|
|
"learning_rate": 2.130384319225617e-05,
|
|
"loss": 0.2478,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1258370727300644,
|
|
"step": 2560,
|
|
"valid_targets_mean": 2940.0,
|
|
"valid_targets_min": 689
|
|
},
|
|
{
|
|
"epoch": 3.7281976744186047,
|
|
"grad_norm": 0.45572529846881993,
|
|
"learning_rate": 2.1231501846695128e-05,
|
|
"loss": 0.2399,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11863773316144943,
|
|
"step": 2565,
|
|
"valid_targets_mean": 3968.6,
|
|
"valid_targets_min": 620
|
|
},
|
|
{
|
|
"epoch": 3.7354651162790695,
|
|
"grad_norm": 0.6015378265452319,
|
|
"learning_rate": 2.115914432418822e-05,
|
|
"loss": 0.2729,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11300826072692871,
|
|
"step": 2570,
|
|
"valid_targets_mean": 2512.4,
|
|
"valid_targets_min": 305
|
|
},
|
|
{
|
|
"epoch": 3.7427325581395348,
|
|
"grad_norm": 0.4742783086567257,
|
|
"learning_rate": 2.1086771575220203e-05,
|
|
"loss": 0.25,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11191293597221375,
|
|
"step": 2575,
|
|
"valid_targets_mean": 3764.5,
|
|
"valid_targets_min": 692
|
|
},
|
|
{
|
|
"epoch": 3.75,
|
|
"grad_norm": 0.616691924655716,
|
|
"learning_rate": 2.1014384550475836e-05,
|
|
"loss": 0.2516,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12944871187210083,
|
|
"step": 2580,
|
|
"valid_targets_mean": 3347.6,
|
|
"valid_targets_min": 559
|
|
},
|
|
{
|
|
"epoch": 3.7572674418604652,
|
|
"grad_norm": 0.5232814265115104,
|
|
"learning_rate": 2.0941984200827402e-05,
|
|
"loss": 0.2503,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0992535650730133,
|
|
"step": 2585,
|
|
"valid_targets_mean": 2465.5,
|
|
"valid_targets_min": 607
|
|
},
|
|
{
|
|
"epoch": 3.7645348837209305,
|
|
"grad_norm": 0.5258965525649895,
|
|
"learning_rate": 2.0869571477322244e-05,
|
|
"loss": 0.2449,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13085459172725677,
|
|
"step": 2590,
|
|
"valid_targets_mean": 3935.5,
|
|
"valid_targets_min": 763
|
|
},
|
|
{
|
|
"epoch": 3.7718023255813953,
|
|
"grad_norm": 0.44500756957595106,
|
|
"learning_rate": 2.079714733117021e-05,
|
|
"loss": 0.2455,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11444681882858276,
|
|
"step": 2595,
|
|
"valid_targets_mean": 3957.0,
|
|
"valid_targets_min": 550
|
|
},
|
|
{
|
|
"epoch": 3.7790697674418605,
|
|
"grad_norm": 0.5892004703984094,
|
|
"learning_rate": 2.0724712713731226e-05,
|
|
"loss": 0.2485,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15046679973602295,
|
|
"step": 2600,
|
|
"valid_targets_mean": 4229.1,
|
|
"valid_targets_min": 580
|
|
},
|
|
{
|
|
"epoch": 3.7863372093023253,
|
|
"grad_norm": 0.47684359150895883,
|
|
"learning_rate": 2.065226857650275e-05,
|
|
"loss": 0.2429,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1092211902141571,
|
|
"step": 2605,
|
|
"valid_targets_mean": 3531.9,
|
|
"valid_targets_min": 605
|
|
},
|
|
{
|
|
"epoch": 3.7936046511627906,
|
|
"grad_norm": 0.5363383293906026,
|
|
"learning_rate": 2.0579815871107304e-05,
|
|
"loss": 0.2548,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16444739699363708,
|
|
"step": 2610,
|
|
"valid_targets_mean": 4181.2,
|
|
"valid_targets_min": 1082
|
|
},
|
|
{
|
|
"epoch": 3.800872093023256,
|
|
"grad_norm": 0.526393012658088,
|
|
"learning_rate": 2.0507355549279948e-05,
|
|
"loss": 0.2563,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.123906210064888,
|
|
"step": 2615,
|
|
"valid_targets_mean": 3755.0,
|
|
"valid_targets_min": 623
|
|
},
|
|
{
|
|
"epoch": 3.808139534883721,
|
|
"grad_norm": 0.5722494539766595,
|
|
"learning_rate": 2.04348885628558e-05,
|
|
"loss": 0.2539,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10296878218650818,
|
|
"step": 2620,
|
|
"valid_targets_mean": 2965.0,
|
|
"valid_targets_min": 762
|
|
},
|
|
{
|
|
"epoch": 3.8154069767441863,
|
|
"grad_norm": 0.48156563178261913,
|
|
"learning_rate": 2.036241586375753e-05,
|
|
"loss": 0.2587,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11730596423149109,
|
|
"step": 2625,
|
|
"valid_targets_mean": 3191.0,
|
|
"valid_targets_min": 784
|
|
},
|
|
{
|
|
"epoch": 3.822674418604651,
|
|
"grad_norm": 0.45226777167929455,
|
|
"learning_rate": 2.0289938403982834e-05,
|
|
"loss": 0.2573,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12582166492938995,
|
|
"step": 2630,
|
|
"valid_targets_mean": 4109.1,
|
|
"valid_targets_min": 440
|
|
},
|
|
{
|
|
"epoch": 3.8299418604651163,
|
|
"grad_norm": 0.5165198595050065,
|
|
"learning_rate": 2.0217457135591957e-05,
|
|
"loss": 0.2504,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12305717170238495,
|
|
"step": 2635,
|
|
"valid_targets_mean": 3467.5,
|
|
"valid_targets_min": 672
|
|
},
|
|
{
|
|
"epoch": 3.8372093023255816,
|
|
"grad_norm": 0.4587107429102401,
|
|
"learning_rate": 2.0144973010695157e-05,
|
|
"loss": 0.2381,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11890917271375656,
|
|
"step": 2640,
|
|
"valid_targets_mean": 4045.8,
|
|
"valid_targets_min": 497
|
|
},
|
|
{
|
|
"epoch": 3.8444767441860463,
|
|
"grad_norm": 0.4206311855873854,
|
|
"learning_rate": 2.0072486981440237e-05,
|
|
"loss": 0.2644,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1283896565437317,
|
|
"step": 2645,
|
|
"valid_targets_mean": 5033.2,
|
|
"valid_targets_min": 430
|
|
},
|
|
{
|
|
"epoch": 3.8517441860465116,
|
|
"grad_norm": 0.5199399403871814,
|
|
"learning_rate": 2e-05,
|
|
"loss": 0.2434,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13101065158843994,
|
|
"step": 2650,
|
|
"valid_targets_mean": 4126.1,
|
|
"valid_targets_min": 623
|
|
},
|
|
{
|
|
"epoch": 3.859011627906977,
|
|
"grad_norm": 0.530627097236436,
|
|
"learning_rate": 1.9927513018559767e-05,
|
|
"loss": 0.2588,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14129270613193512,
|
|
"step": 2655,
|
|
"valid_targets_mean": 3838.5,
|
|
"valid_targets_min": 646
|
|
},
|
|
{
|
|
"epoch": 3.866279069767442,
|
|
"grad_norm": 0.5182581748716937,
|
|
"learning_rate": 1.985502698930485e-05,
|
|
"loss": 0.2484,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11419911682605743,
|
|
"step": 2660,
|
|
"valid_targets_mean": 3422.4,
|
|
"valid_targets_min": 470
|
|
},
|
|
{
|
|
"epoch": 3.873546511627907,
|
|
"grad_norm": 0.637313644513782,
|
|
"learning_rate": 1.978254286440805e-05,
|
|
"loss": 0.256,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13794487714767456,
|
|
"step": 2665,
|
|
"valid_targets_mean": 2414.5,
|
|
"valid_targets_min": 486
|
|
},
|
|
{
|
|
"epoch": 3.880813953488372,
|
|
"grad_norm": 0.5972117317746191,
|
|
"learning_rate": 1.9710061596017172e-05,
|
|
"loss": 0.2522,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10965625196695328,
|
|
"step": 2670,
|
|
"valid_targets_mean": 2143.2,
|
|
"valid_targets_min": 343
|
|
},
|
|
{
|
|
"epoch": 3.8880813953488373,
|
|
"grad_norm": 0.49321698475016185,
|
|
"learning_rate": 1.9637584136242474e-05,
|
|
"loss": 0.2443,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11436263471841812,
|
|
"step": 2675,
|
|
"valid_targets_mean": 3455.9,
|
|
"valid_targets_min": 834
|
|
},
|
|
{
|
|
"epoch": 3.895348837209302,
|
|
"grad_norm": 0.45465791335008415,
|
|
"learning_rate": 1.9565111437144204e-05,
|
|
"loss": 0.2456,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12260943651199341,
|
|
"step": 2680,
|
|
"valid_targets_mean": 3845.8,
|
|
"valid_targets_min": 649
|
|
},
|
|
{
|
|
"epoch": 3.9026162790697674,
|
|
"grad_norm": 0.4530349993977751,
|
|
"learning_rate": 1.949264445072006e-05,
|
|
"loss": 0.2362,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1056285873055458,
|
|
"step": 2685,
|
|
"valid_targets_mean": 4397.9,
|
|
"valid_targets_min": 3450
|
|
},
|
|
{
|
|
"epoch": 3.9098837209302326,
|
|
"grad_norm": 0.5537681968399243,
|
|
"learning_rate": 1.9420184128892702e-05,
|
|
"loss": 0.2542,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1130150854587555,
|
|
"step": 2690,
|
|
"valid_targets_mean": 2776.1,
|
|
"valid_targets_min": 590
|
|
},
|
|
{
|
|
"epoch": 3.917151162790698,
|
|
"grad_norm": 0.49150433914817926,
|
|
"learning_rate": 1.9347731423497255e-05,
|
|
"loss": 0.2389,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10140958428382874,
|
|
"step": 2695,
|
|
"valid_targets_mean": 2692.9,
|
|
"valid_targets_min": 264
|
|
},
|
|
{
|
|
"epoch": 3.9244186046511627,
|
|
"grad_norm": 0.463733543118443,
|
|
"learning_rate": 1.927528728626878e-05,
|
|
"loss": 0.2448,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08858418464660645,
|
|
"step": 2700,
|
|
"valid_targets_mean": 3079.4,
|
|
"valid_targets_min": 605
|
|
},
|
|
{
|
|
"epoch": 3.931686046511628,
|
|
"grad_norm": 0.43522051270813206,
|
|
"learning_rate": 1.9202852668829796e-05,
|
|
"loss": 0.2359,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10103869438171387,
|
|
"step": 2705,
|
|
"valid_targets_mean": 3345.5,
|
|
"valid_targets_min": 355
|
|
},
|
|
{
|
|
"epoch": 3.938953488372093,
|
|
"grad_norm": 0.529140425090723,
|
|
"learning_rate": 1.9130428522677762e-05,
|
|
"loss": 0.26,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13211511075496674,
|
|
"step": 2710,
|
|
"valid_targets_mean": 3707.6,
|
|
"valid_targets_min": 200
|
|
},
|
|
{
|
|
"epoch": 3.946220930232558,
|
|
"grad_norm": 0.5146828971465376,
|
|
"learning_rate": 1.90580157991726e-05,
|
|
"loss": 0.2491,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16741503775119781,
|
|
"step": 2715,
|
|
"valid_targets_mean": 4682.1,
|
|
"valid_targets_min": 599
|
|
},
|
|
{
|
|
"epoch": 3.953488372093023,
|
|
"grad_norm": 0.48420609335106185,
|
|
"learning_rate": 1.898561544952417e-05,
|
|
"loss": 0.2498,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10657159984111786,
|
|
"step": 2720,
|
|
"valid_targets_mean": 4151.6,
|
|
"valid_targets_min": 806
|
|
},
|
|
{
|
|
"epoch": 3.9607558139534884,
|
|
"grad_norm": 0.5015110455391134,
|
|
"learning_rate": 1.8913228424779807e-05,
|
|
"loss": 0.2591,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1371941715478897,
|
|
"step": 2725,
|
|
"valid_targets_mean": 4309.9,
|
|
"valid_targets_min": 454
|
|
},
|
|
{
|
|
"epoch": 3.9680232558139537,
|
|
"grad_norm": 0.4908011439298694,
|
|
"learning_rate": 1.8840855675811788e-05,
|
|
"loss": 0.2475,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12342453002929688,
|
|
"step": 2730,
|
|
"valid_targets_mean": 3556.0,
|
|
"valid_targets_min": 417
|
|
},
|
|
{
|
|
"epoch": 3.9752906976744184,
|
|
"grad_norm": 0.5588263603143331,
|
|
"learning_rate": 1.876849815330488e-05,
|
|
"loss": 0.2443,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13135354220867157,
|
|
"step": 2735,
|
|
"valid_targets_mean": 2600.1,
|
|
"valid_targets_min": 418
|
|
},
|
|
{
|
|
"epoch": 3.9825581395348837,
|
|
"grad_norm": 0.47777874175500507,
|
|
"learning_rate": 1.869615680774384e-05,
|
|
"loss": 0.2465,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12580084800720215,
|
|
"step": 2740,
|
|
"valid_targets_mean": 4400.2,
|
|
"valid_targets_min": 3574
|
|
},
|
|
{
|
|
"epoch": 3.989825581395349,
|
|
"grad_norm": 0.44558810186639114,
|
|
"learning_rate": 1.862383258940091e-05,
|
|
"loss": 0.2506,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13136231899261475,
|
|
"step": 2745,
|
|
"valid_targets_mean": 4948.2,
|
|
"valid_targets_min": 3743
|
|
},
|
|
{
|
|
"epoch": 3.9970930232558137,
|
|
"grad_norm": 0.5080444419554163,
|
|
"learning_rate": 1.8551526448323366e-05,
|
|
"loss": 0.2565,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12025821208953857,
|
|
"step": 2750,
|
|
"valid_targets_mean": 3291.0,
|
|
"valid_targets_min": 752
|
|
},
|
|
{
|
|
"epoch": 4.004360465116279,
|
|
"grad_norm": 0.48352137501238807,
|
|
"learning_rate": 1.8479239334321005e-05,
|
|
"loss": 0.2407,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09484989941120148,
|
|
"step": 2755,
|
|
"valid_targets_mean": 2745.0,
|
|
"valid_targets_min": 578
|
|
},
|
|
{
|
|
"epoch": 4.011627906976744,
|
|
"grad_norm": 0.47367899779143086,
|
|
"learning_rate": 1.84069721969537e-05,
|
|
"loss": 0.2441,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1370040476322174,
|
|
"step": 2760,
|
|
"valid_targets_mean": 4967.2,
|
|
"valid_targets_min": 3396
|
|
},
|
|
{
|
|
"epoch": 4.0188953488372094,
|
|
"grad_norm": 0.54231002499266,
|
|
"learning_rate": 1.8334725985518898e-05,
|
|
"loss": 0.2303,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13151651620864868,
|
|
"step": 2765,
|
|
"valid_targets_mean": 3523.4,
|
|
"valid_targets_min": 542
|
|
},
|
|
{
|
|
"epoch": 4.026162790697675,
|
|
"grad_norm": 0.5238485007583942,
|
|
"learning_rate": 1.8262501649039178e-05,
|
|
"loss": 0.2244,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12579235434532166,
|
|
"step": 2770,
|
|
"valid_targets_mean": 4157.2,
|
|
"valid_targets_min": 742
|
|
},
|
|
{
|
|
"epoch": 4.03343023255814,
|
|
"grad_norm": 0.45102153752627877,
|
|
"learning_rate": 1.819030013624977e-05,
|
|
"loss": 0.2225,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1172993928194046,
|
|
"step": 2775,
|
|
"valid_targets_mean": 4752.1,
|
|
"valid_targets_min": 946
|
|
},
|
|
{
|
|
"epoch": 4.040697674418604,
|
|
"grad_norm": 0.5285857229676709,
|
|
"learning_rate": 1.8118122395586076e-05,
|
|
"loss": 0.2299,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10665304958820343,
|
|
"step": 2780,
|
|
"valid_targets_mean": 3128.1,
|
|
"valid_targets_min": 343
|
|
},
|
|
{
|
|
"epoch": 4.0479651162790695,
|
|
"grad_norm": 0.5909177336340645,
|
|
"learning_rate": 1.8045969375171257e-05,
|
|
"loss": 0.2274,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08512631803750992,
|
|
"step": 2785,
|
|
"valid_targets_mean": 2385.5,
|
|
"valid_targets_min": 587
|
|
},
|
|
{
|
|
"epoch": 4.055232558139535,
|
|
"grad_norm": 0.5095522606610547,
|
|
"learning_rate": 1.797384202280371e-05,
|
|
"loss": 0.2341,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1267683058977127,
|
|
"step": 2790,
|
|
"valid_targets_mean": 4405.8,
|
|
"valid_targets_min": 900
|
|
},
|
|
{
|
|
"epoch": 4.0625,
|
|
"grad_norm": 0.5144409488432192,
|
|
"learning_rate": 1.7901741285944703e-05,
|
|
"loss": 0.2428,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08859217166900635,
|
|
"step": 2795,
|
|
"valid_targets_mean": 2686.4,
|
|
"valid_targets_min": 547
|
|
},
|
|
{
|
|
"epoch": 4.069767441860465,
|
|
"grad_norm": 0.4876395280578797,
|
|
"learning_rate": 1.782966811170585e-05,
|
|
"loss": 0.2292,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10345523804426193,
|
|
"step": 2800,
|
|
"valid_targets_mean": 3438.8,
|
|
"valid_targets_min": 577
|
|
},
|
|
{
|
|
"epoch": 4.0770348837209305,
|
|
"grad_norm": 0.5231245613946751,
|
|
"learning_rate": 1.7757623446836718e-05,
|
|
"loss": 0.2364,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11259502172470093,
|
|
"step": 2805,
|
|
"valid_targets_mean": 3414.0,
|
|
"valid_targets_min": 632
|
|
},
|
|
{
|
|
"epoch": 4.084302325581396,
|
|
"grad_norm": 0.6811959784490158,
|
|
"learning_rate": 1.768560823771238e-05,
|
|
"loss": 0.2415,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12798871099948883,
|
|
"step": 2810,
|
|
"valid_targets_mean": 2597.0,
|
|
"valid_targets_min": 567
|
|
},
|
|
{
|
|
"epoch": 4.09156976744186,
|
|
"grad_norm": 0.48633463675024335,
|
|
"learning_rate": 1.761362343032097e-05,
|
|
"loss": 0.2312,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1147952675819397,
|
|
"step": 2815,
|
|
"valid_targets_mean": 4718.0,
|
|
"valid_targets_min": 727
|
|
},
|
|
{
|
|
"epoch": 4.098837209302325,
|
|
"grad_norm": 0.49148880429117153,
|
|
"learning_rate": 1.754166997025127e-05,
|
|
"loss": 0.2305,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10578566789627075,
|
|
"step": 2820,
|
|
"valid_targets_mean": 3059.4,
|
|
"valid_targets_min": 441
|
|
},
|
|
{
|
|
"epoch": 4.1061046511627906,
|
|
"grad_norm": 0.5393816683284496,
|
|
"learning_rate": 1.7469748802680284e-05,
|
|
"loss": 0.2419,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1297258585691452,
|
|
"step": 2825,
|
|
"valid_targets_mean": 3596.8,
|
|
"valid_targets_min": 427
|
|
},
|
|
{
|
|
"epoch": 4.113372093023256,
|
|
"grad_norm": 0.47219143164141136,
|
|
"learning_rate": 1.739786087236083e-05,
|
|
"loss": 0.2266,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10674222558736801,
|
|
"step": 2830,
|
|
"valid_targets_mean": 3580.6,
|
|
"valid_targets_min": 509
|
|
},
|
|
{
|
|
"epoch": 4.120639534883721,
|
|
"grad_norm": 0.6061970319339015,
|
|
"learning_rate": 1.7326007123609123e-05,
|
|
"loss": 0.2294,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1318361610174179,
|
|
"step": 2835,
|
|
"valid_targets_mean": 4211.0,
|
|
"valid_targets_min": 568
|
|
},
|
|
{
|
|
"epoch": 4.127906976744186,
|
|
"grad_norm": 0.5711398358480915,
|
|
"learning_rate": 1.7254188500292355e-05,
|
|
"loss": 0.2492,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10918092727661133,
|
|
"step": 2840,
|
|
"valid_targets_mean": 2878.5,
|
|
"valid_targets_min": 728
|
|
},
|
|
{
|
|
"epoch": 4.1351744186046515,
|
|
"grad_norm": 0.5016679889674767,
|
|
"learning_rate": 1.718240594581633e-05,
|
|
"loss": 0.2389,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11699994653463364,
|
|
"step": 2845,
|
|
"valid_targets_mean": 4029.2,
|
|
"valid_targets_min": 837
|
|
},
|
|
{
|
|
"epoch": 4.142441860465116,
|
|
"grad_norm": 0.5587655319921159,
|
|
"learning_rate": 1.7110660403113045e-05,
|
|
"loss": 0.2469,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12280265986919403,
|
|
"step": 2850,
|
|
"valid_targets_mean": 3420.0,
|
|
"valid_targets_min": 608
|
|
},
|
|
{
|
|
"epoch": 4.149709302325581,
|
|
"grad_norm": 0.5700563652644026,
|
|
"learning_rate": 1.7038952814628312e-05,
|
|
"loss": 0.2403,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09359048306941986,
|
|
"step": 2855,
|
|
"valid_targets_mean": 2218.0,
|
|
"valid_targets_min": 433
|
|
},
|
|
{
|
|
"epoch": 4.156976744186046,
|
|
"grad_norm": 0.5315568391996941,
|
|
"learning_rate": 1.6967284122309385e-05,
|
|
"loss": 0.2374,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10375300794839859,
|
|
"step": 2860,
|
|
"valid_targets_mean": 2193.4,
|
|
"valid_targets_min": 603
|
|
},
|
|
{
|
|
"epoch": 4.164244186046512,
|
|
"grad_norm": 0.46104529117658105,
|
|
"learning_rate": 1.6895655267592567e-05,
|
|
"loss": 0.2343,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13019639253616333,
|
|
"step": 2865,
|
|
"valid_targets_mean": 5004.2,
|
|
"valid_targets_min": 4129
|
|
},
|
|
{
|
|
"epoch": 4.171511627906977,
|
|
"grad_norm": 0.5017086926945395,
|
|
"learning_rate": 1.6824067191390872e-05,
|
|
"loss": 0.238,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12526315450668335,
|
|
"step": 2870,
|
|
"valid_targets_mean": 3909.9,
|
|
"valid_targets_min": 665
|
|
},
|
|
{
|
|
"epoch": 4.178779069767442,
|
|
"grad_norm": 0.4971611429298911,
|
|
"learning_rate": 1.675252083408164e-05,
|
|
"loss": 0.2295,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10105648636817932,
|
|
"step": 2875,
|
|
"valid_targets_mean": 3390.0,
|
|
"valid_targets_min": 810
|
|
},
|
|
{
|
|
"epoch": 4.186046511627907,
|
|
"grad_norm": 0.63719445496211,
|
|
"learning_rate": 1.6681017135494194e-05,
|
|
"loss": 0.2324,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12060322612524033,
|
|
"step": 2880,
|
|
"valid_targets_mean": 2759.0,
|
|
"valid_targets_min": 700
|
|
},
|
|
{
|
|
"epoch": 4.1933139534883725,
|
|
"grad_norm": 0.6313240833284652,
|
|
"learning_rate": 1.66095570348975e-05,
|
|
"loss": 0.2362,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14655247330665588,
|
|
"step": 2885,
|
|
"valid_targets_mean": 3164.0,
|
|
"valid_targets_min": 688
|
|
},
|
|
{
|
|
"epoch": 4.200581395348837,
|
|
"grad_norm": 0.48700081990187133,
|
|
"learning_rate": 1.653814147098781e-05,
|
|
"loss": 0.2374,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11685729026794434,
|
|
"step": 2890,
|
|
"valid_targets_mean": 4256.5,
|
|
"valid_targets_min": 885
|
|
},
|
|
{
|
|
"epoch": 4.207848837209302,
|
|
"grad_norm": 0.6232894954120523,
|
|
"learning_rate": 1.6466771381876365e-05,
|
|
"loss": 0.2351,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11992734670639038,
|
|
"step": 2895,
|
|
"valid_targets_mean": 3321.0,
|
|
"valid_targets_min": 662
|
|
},
|
|
{
|
|
"epoch": 4.215116279069767,
|
|
"grad_norm": 0.4917083432054533,
|
|
"learning_rate": 1.639544770507703e-05,
|
|
"loss": 0.2366,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12429793179035187,
|
|
"step": 2900,
|
|
"valid_targets_mean": 4300.4,
|
|
"valid_targets_min": 286
|
|
},
|
|
{
|
|
"epoch": 4.222383720930233,
|
|
"grad_norm": 0.5210145808392682,
|
|
"learning_rate": 1.6324171377494015e-05,
|
|
"loss": 0.2399,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11657124012708664,
|
|
"step": 2905,
|
|
"valid_targets_mean": 3128.8,
|
|
"valid_targets_min": 749
|
|
},
|
|
{
|
|
"epoch": 4.229651162790698,
|
|
"grad_norm": 0.5162901164850011,
|
|
"learning_rate": 1.6252943335409542e-05,
|
|
"loss": 0.233,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10562814772129059,
|
|
"step": 2910,
|
|
"valid_targets_mean": 3470.4,
|
|
"valid_targets_min": 679
|
|
},
|
|
{
|
|
"epoch": 4.236918604651163,
|
|
"grad_norm": 0.564598628475888,
|
|
"learning_rate": 1.6181764514471566e-05,
|
|
"loss": 0.231,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09816817939281464,
|
|
"step": 2915,
|
|
"valid_targets_mean": 2720.0,
|
|
"valid_targets_min": 545
|
|
},
|
|
{
|
|
"epoch": 4.2441860465116275,
|
|
"grad_norm": 0.5262034337491491,
|
|
"learning_rate": 1.611063584968148e-05,
|
|
"loss": 0.2266,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14536155760288239,
|
|
"step": 2920,
|
|
"valid_targets_mean": 4571.6,
|
|
"valid_targets_min": 868
|
|
},
|
|
{
|
|
"epoch": 4.251453488372093,
|
|
"grad_norm": 0.5443324066129965,
|
|
"learning_rate": 1.6039558275381812e-05,
|
|
"loss": 0.243,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08932915329933167,
|
|
"step": 2925,
|
|
"valid_targets_mean": 2445.5,
|
|
"valid_targets_min": 691
|
|
},
|
|
{
|
|
"epoch": 4.258720930232558,
|
|
"grad_norm": 0.524434173056238,
|
|
"learning_rate": 1.596853272524398e-05,
|
|
"loss": 0.2305,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12700089812278748,
|
|
"step": 2930,
|
|
"valid_targets_mean": 4030.2,
|
|
"valid_targets_min": 459
|
|
},
|
|
{
|
|
"epoch": 4.265988372093023,
|
|
"grad_norm": 0.6159042780695054,
|
|
"learning_rate": 1.5897560132256008e-05,
|
|
"loss": 0.2348,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09032024443149567,
|
|
"step": 2935,
|
|
"valid_targets_mean": 2270.6,
|
|
"valid_targets_min": 565
|
|
},
|
|
{
|
|
"epoch": 4.273255813953488,
|
|
"grad_norm": 0.5937855344203165,
|
|
"learning_rate": 1.582664142871029e-05,
|
|
"loss": 0.2459,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1407282054424286,
|
|
"step": 2940,
|
|
"valid_targets_mean": 3228.5,
|
|
"valid_targets_min": 654
|
|
},
|
|
{
|
|
"epoch": 4.280523255813954,
|
|
"grad_norm": 0.544590296799247,
|
|
"learning_rate": 1.5755777546191313e-05,
|
|
"loss": 0.2202,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08907799422740936,
|
|
"step": 2945,
|
|
"valid_targets_mean": 2940.5,
|
|
"valid_targets_min": 597
|
|
},
|
|
{
|
|
"epoch": 4.287790697674419,
|
|
"grad_norm": 0.5014969531374299,
|
|
"learning_rate": 1.5684969415563456e-05,
|
|
"loss": 0.2319,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13449829816818237,
|
|
"step": 2950,
|
|
"valid_targets_mean": 3845.8,
|
|
"valid_targets_min": 527
|
|
},
|
|
{
|
|
"epoch": 4.295058139534884,
|
|
"grad_norm": 0.5494535644403714,
|
|
"learning_rate": 1.5614217966958725e-05,
|
|
"loss": 0.2385,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10309483855962753,
|
|
"step": 2955,
|
|
"valid_targets_mean": 2985.2,
|
|
"valid_targets_min": 698
|
|
},
|
|
{
|
|
"epoch": 4.3023255813953485,
|
|
"grad_norm": 0.4382128256233561,
|
|
"learning_rate": 1.554352412976457e-05,
|
|
"loss": 0.2318,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10149140655994415,
|
|
"step": 2960,
|
|
"valid_targets_mean": 4764.4,
|
|
"valid_targets_min": 3860
|
|
},
|
|
{
|
|
"epoch": 4.309593023255814,
|
|
"grad_norm": 0.5049094177590457,
|
|
"learning_rate": 1.5472888832611662e-05,
|
|
"loss": 0.2395,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13525943458080292,
|
|
"step": 2965,
|
|
"valid_targets_mean": 4419.8,
|
|
"valid_targets_min": 666
|
|
},
|
|
{
|
|
"epoch": 4.316860465116279,
|
|
"grad_norm": 0.6480364173889341,
|
|
"learning_rate": 1.5402313003361676e-05,
|
|
"loss": 0.2455,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08497101068496704,
|
|
"step": 2970,
|
|
"valid_targets_mean": 1814.9,
|
|
"valid_targets_min": 676
|
|
},
|
|
{
|
|
"epoch": 4.324127906976744,
|
|
"grad_norm": 0.6067490783183469,
|
|
"learning_rate": 1.533179756909513e-05,
|
|
"loss": 0.2526,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.20556490123271942,
|
|
"step": 2975,
|
|
"valid_targets_mean": 4119.9,
|
|
"valid_targets_min": 1004
|
|
},
|
|
{
|
|
"epoch": 4.3313953488372094,
|
|
"grad_norm": 0.6669582826595135,
|
|
"learning_rate": 1.52613434560992e-05,
|
|
"loss": 0.2355,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10513143986463547,
|
|
"step": 2980,
|
|
"valid_targets_mean": 2029.0,
|
|
"valid_targets_min": 359
|
|
},
|
|
{
|
|
"epoch": 4.338662790697675,
|
|
"grad_norm": 0.4563801791059827,
|
|
"learning_rate": 1.519095158985554e-05,
|
|
"loss": 0.2357,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1262395679950714,
|
|
"step": 2985,
|
|
"valid_targets_mean": 4772.6,
|
|
"valid_targets_min": 783
|
|
},
|
|
{
|
|
"epoch": 4.34593023255814,
|
|
"grad_norm": 0.4771548492793852,
|
|
"learning_rate": 1.512062289502814e-05,
|
|
"loss": 0.2331,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1244804859161377,
|
|
"step": 2990,
|
|
"valid_targets_mean": 4250.5,
|
|
"valid_targets_min": 595
|
|
},
|
|
{
|
|
"epoch": 4.353197674418604,
|
|
"grad_norm": 0.4968998207030734,
|
|
"learning_rate": 1.5050358295451173e-05,
|
|
"loss": 0.2347,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10179959237575531,
|
|
"step": 2995,
|
|
"valid_targets_mean": 2665.2,
|
|
"valid_targets_min": 553
|
|
},
|
|
{
|
|
"epoch": 4.3604651162790695,
|
|
"grad_norm": 0.5349989482615872,
|
|
"learning_rate": 1.4980158714116864e-05,
|
|
"loss": 0.2283,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12053326517343521,
|
|
"step": 3000,
|
|
"valid_targets_mean": 3655.0,
|
|
"valid_targets_min": 512
|
|
},
|
|
{
|
|
"epoch": 4.367732558139535,
|
|
"grad_norm": 0.45795082624788974,
|
|
"learning_rate": 1.4910025073163346e-05,
|
|
"loss": 0.2342,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11071191728115082,
|
|
"step": 3005,
|
|
"valid_targets_mean": 4073.0,
|
|
"valid_targets_min": 799
|
|
},
|
|
{
|
|
"epoch": 4.375,
|
|
"grad_norm": 0.5488486813247619,
|
|
"learning_rate": 1.4839958293862582e-05,
|
|
"loss": 0.2446,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11098312586545944,
|
|
"step": 3010,
|
|
"valid_targets_mean": 2934.9,
|
|
"valid_targets_min": 830
|
|
},
|
|
{
|
|
"epoch": 4.382267441860465,
|
|
"grad_norm": 0.4999364379943187,
|
|
"learning_rate": 1.4769959296608228e-05,
|
|
"loss": 0.2426,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11597448587417603,
|
|
"step": 3015,
|
|
"valid_targets_mean": 3370.1,
|
|
"valid_targets_min": 562
|
|
},
|
|
{
|
|
"epoch": 4.3895348837209305,
|
|
"grad_norm": 0.6797002456964418,
|
|
"learning_rate": 1.4700029000903575e-05,
|
|
"loss": 0.2412,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12890125811100006,
|
|
"step": 3020,
|
|
"valid_targets_mean": 1933.5,
|
|
"valid_targets_min": 418
|
|
},
|
|
{
|
|
"epoch": 4.396802325581396,
|
|
"grad_norm": 0.6080778703915236,
|
|
"learning_rate": 1.463016832534943e-05,
|
|
"loss": 0.2526,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12549175322055817,
|
|
"step": 3025,
|
|
"valid_targets_mean": 3266.6,
|
|
"valid_targets_min": 663
|
|
},
|
|
{
|
|
"epoch": 4.40406976744186,
|
|
"grad_norm": 0.5399637076155757,
|
|
"learning_rate": 1.4560378187632101e-05,
|
|
"loss": 0.2349,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10789905488491058,
|
|
"step": 3030,
|
|
"valid_targets_mean": 2986.1,
|
|
"valid_targets_min": 586
|
|
},
|
|
{
|
|
"epoch": 4.411337209302325,
|
|
"grad_norm": 0.5178778926974974,
|
|
"learning_rate": 1.4490659504511295e-05,
|
|
"loss": 0.2423,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09591800719499588,
|
|
"step": 3035,
|
|
"valid_targets_mean": 3687.2,
|
|
"valid_targets_min": 615
|
|
},
|
|
{
|
|
"epoch": 4.4186046511627906,
|
|
"grad_norm": 0.5030583012505943,
|
|
"learning_rate": 1.44210131918081e-05,
|
|
"loss": 0.2309,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.121453195810318,
|
|
"step": 3040,
|
|
"valid_targets_mean": 4075.1,
|
|
"valid_targets_min": 569
|
|
},
|
|
{
|
|
"epoch": 4.425872093023256,
|
|
"grad_norm": 0.5641263917257686,
|
|
"learning_rate": 1.4351440164392956e-05,
|
|
"loss": 0.2356,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1182078868150711,
|
|
"step": 3045,
|
|
"valid_targets_mean": 3217.6,
|
|
"valid_targets_min": 607
|
|
},
|
|
{
|
|
"epoch": 4.433139534883721,
|
|
"grad_norm": 0.5939975448891784,
|
|
"learning_rate": 1.4281941336173621e-05,
|
|
"loss": 0.2305,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10988223552703857,
|
|
"step": 3050,
|
|
"valid_targets_mean": 2759.2,
|
|
"valid_targets_min": 535
|
|
},
|
|
{
|
|
"epoch": 4.440406976744186,
|
|
"grad_norm": 0.546560793902984,
|
|
"learning_rate": 1.4212517620083186e-05,
|
|
"loss": 0.2215,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08663086593151093,
|
|
"step": 3055,
|
|
"valid_targets_mean": 2932.1,
|
|
"valid_targets_min": 519
|
|
},
|
|
{
|
|
"epoch": 4.4476744186046515,
|
|
"grad_norm": 0.5318778359190953,
|
|
"learning_rate": 1.4143169928068061e-05,
|
|
"loss": 0.2333,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10948213934898376,
|
|
"step": 3060,
|
|
"valid_targets_mean": 3642.5,
|
|
"valid_targets_min": 729
|
|
},
|
|
{
|
|
"epoch": 4.454941860465116,
|
|
"grad_norm": 0.5341511378601346,
|
|
"learning_rate": 1.4073899171076022e-05,
|
|
"loss": 0.2287,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12564794719219208,
|
|
"step": 3065,
|
|
"valid_targets_mean": 3746.2,
|
|
"valid_targets_min": 720
|
|
},
|
|
{
|
|
"epoch": 4.462209302325581,
|
|
"grad_norm": 0.6152522741279195,
|
|
"learning_rate": 1.400470625904422e-05,
|
|
"loss": 0.2261,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09698937088251114,
|
|
"step": 3070,
|
|
"valid_targets_mean": 3055.4,
|
|
"valid_targets_min": 300
|
|
},
|
|
{
|
|
"epoch": 4.469476744186046,
|
|
"grad_norm": 0.4894759594735516,
|
|
"learning_rate": 1.3935592100887242e-05,
|
|
"loss": 0.2281,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09913764894008636,
|
|
"step": 3075,
|
|
"valid_targets_mean": 3156.9,
|
|
"valid_targets_min": 691
|
|
},
|
|
{
|
|
"epoch": 4.476744186046512,
|
|
"grad_norm": 0.5350561295503559,
|
|
"learning_rate": 1.386655760448517e-05,
|
|
"loss": 0.2353,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14611050486564636,
|
|
"step": 3080,
|
|
"valid_targets_mean": 5077.9,
|
|
"valid_targets_min": 3504
|
|
},
|
|
{
|
|
"epoch": 4.484011627906977,
|
|
"grad_norm": 0.5317175369468766,
|
|
"learning_rate": 1.3797603676671646e-05,
|
|
"loss": 0.2344,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09551812708377838,
|
|
"step": 3085,
|
|
"valid_targets_mean": 3002.4,
|
|
"valid_targets_min": 558
|
|
},
|
|
{
|
|
"epoch": 4.491279069767442,
|
|
"grad_norm": 0.4435122144509018,
|
|
"learning_rate": 1.372873122322198e-05,
|
|
"loss": 0.229,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0975491851568222,
|
|
"step": 3090,
|
|
"valid_targets_mean": 3885.2,
|
|
"valid_targets_min": 764
|
|
},
|
|
{
|
|
"epoch": 4.498546511627907,
|
|
"grad_norm": 0.5024935576623654,
|
|
"learning_rate": 1.365994114884122e-05,
|
|
"loss": 0.2391,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11409218609333038,
|
|
"step": 3095,
|
|
"valid_targets_mean": 4141.4,
|
|
"valid_targets_min": 587
|
|
},
|
|
{
|
|
"epoch": 4.5058139534883725,
|
|
"grad_norm": 0.5434331061009773,
|
|
"learning_rate": 1.359123435715231e-05,
|
|
"loss": 0.2357,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09311437606811523,
|
|
"step": 3100,
|
|
"valid_targets_mean": 2983.4,
|
|
"valid_targets_min": 815
|
|
},
|
|
{
|
|
"epoch": 4.513081395348837,
|
|
"grad_norm": 0.45263073099805023,
|
|
"learning_rate": 1.3522611750684171e-05,
|
|
"loss": 0.2297,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11372917890548706,
|
|
"step": 3105,
|
|
"valid_targets_mean": 3772.0,
|
|
"valid_targets_min": 431
|
|
},
|
|
{
|
|
"epoch": 4.520348837209302,
|
|
"grad_norm": 0.6272229613079687,
|
|
"learning_rate": 1.3454074230859896e-05,
|
|
"loss": 0.2428,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16346322000026703,
|
|
"step": 3110,
|
|
"valid_targets_mean": 3129.0,
|
|
"valid_targets_min": 552
|
|
},
|
|
{
|
|
"epoch": 4.527616279069767,
|
|
"grad_norm": 0.5038465829473497,
|
|
"learning_rate": 1.3385622697984872e-05,
|
|
"loss": 0.2332,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11544954776763916,
|
|
"step": 3115,
|
|
"valid_targets_mean": 3430.9,
|
|
"valid_targets_min": 395
|
|
},
|
|
{
|
|
"epoch": 4.534883720930233,
|
|
"grad_norm": 0.5887483028437017,
|
|
"learning_rate": 1.331725805123496e-05,
|
|
"loss": 0.2386,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10782928764820099,
|
|
"step": 3120,
|
|
"valid_targets_mean": 2734.6,
|
|
"valid_targets_min": 665
|
|
},
|
|
{
|
|
"epoch": 4.542151162790698,
|
|
"grad_norm": 0.5010126807103301,
|
|
"learning_rate": 1.3248981188644703e-05,
|
|
"loss": 0.2374,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15959912538528442,
|
|
"step": 3125,
|
|
"valid_targets_mean": 4801.8,
|
|
"valid_targets_min": 3198
|
|
},
|
|
{
|
|
"epoch": 4.549418604651163,
|
|
"grad_norm": 0.5303282635413874,
|
|
"learning_rate": 1.3180793007095502e-05,
|
|
"loss": 0.2296,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1328737735748291,
|
|
"step": 3130,
|
|
"valid_targets_mean": 3531.9,
|
|
"valid_targets_min": 916
|
|
},
|
|
{
|
|
"epoch": 4.5566860465116275,
|
|
"grad_norm": 0.48575033418771363,
|
|
"learning_rate": 1.3112694402303863e-05,
|
|
"loss": 0.2527,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16913628578186035,
|
|
"step": 3135,
|
|
"valid_targets_mean": 5586.6,
|
|
"valid_targets_min": 806
|
|
},
|
|
{
|
|
"epoch": 4.563953488372093,
|
|
"grad_norm": 0.48981867193444983,
|
|
"learning_rate": 1.3044686268809596e-05,
|
|
"loss": 0.2489,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13943105936050415,
|
|
"step": 3140,
|
|
"valid_targets_mean": 4203.0,
|
|
"valid_targets_min": 1091
|
|
},
|
|
{
|
|
"epoch": 4.571220930232558,
|
|
"grad_norm": 0.5305974079239972,
|
|
"learning_rate": 1.2976769499964109e-05,
|
|
"loss": 0.236,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15359435975551605,
|
|
"step": 3145,
|
|
"valid_targets_mean": 4305.5,
|
|
"valid_targets_min": 550
|
|
},
|
|
{
|
|
"epoch": 4.578488372093023,
|
|
"grad_norm": 0.5630598119690939,
|
|
"learning_rate": 1.2908944987918633e-05,
|
|
"loss": 0.2395,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15561619400978088,
|
|
"step": 3150,
|
|
"valid_targets_mean": 3796.2,
|
|
"valid_targets_min": 720
|
|
},
|
|
{
|
|
"epoch": 4.585755813953488,
|
|
"grad_norm": 0.4690829743543244,
|
|
"learning_rate": 1.2841213623612519e-05,
|
|
"loss": 0.2301,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10580013692378998,
|
|
"step": 3155,
|
|
"valid_targets_mean": 3367.6,
|
|
"valid_targets_min": 611
|
|
},
|
|
{
|
|
"epoch": 4.593023255813954,
|
|
"grad_norm": 0.5289397793275402,
|
|
"learning_rate": 1.2773576296761542e-05,
|
|
"loss": 0.2346,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13507477939128876,
|
|
"step": 3160,
|
|
"valid_targets_mean": 3805.9,
|
|
"valid_targets_min": 743
|
|
},
|
|
{
|
|
"epoch": 4.600290697674419,
|
|
"grad_norm": 0.5426964454812239,
|
|
"learning_rate": 1.2706033895846192e-05,
|
|
"loss": 0.2265,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09324119985103607,
|
|
"step": 3165,
|
|
"valid_targets_mean": 2972.5,
|
|
"valid_targets_min": 590
|
|
},
|
|
{
|
|
"epoch": 4.607558139534884,
|
|
"grad_norm": 0.5634432609885214,
|
|
"learning_rate": 1.2638587308100036e-05,
|
|
"loss": 0.2395,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11684857308864594,
|
|
"step": 3170,
|
|
"valid_targets_mean": 3209.4,
|
|
"valid_targets_min": 577
|
|
},
|
|
{
|
|
"epoch": 4.6148255813953485,
|
|
"grad_norm": 0.48953334327704895,
|
|
"learning_rate": 1.2571237419498018e-05,
|
|
"loss": 0.227,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11784234642982483,
|
|
"step": 3175,
|
|
"valid_targets_mean": 4379.2,
|
|
"valid_targets_min": 968
|
|
},
|
|
{
|
|
"epoch": 4.622093023255814,
|
|
"grad_norm": 0.5210611303116327,
|
|
"learning_rate": 1.2503985114744883e-05,
|
|
"loss": 0.2283,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10520151257514954,
|
|
"step": 3180,
|
|
"valid_targets_mean": 4008.8,
|
|
"valid_targets_min": 3184
|
|
},
|
|
{
|
|
"epoch": 4.629360465116279,
|
|
"grad_norm": 0.4773875572630403,
|
|
"learning_rate": 1.2436831277263481e-05,
|
|
"loss": 0.2497,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1177573874592781,
|
|
"step": 3185,
|
|
"valid_targets_mean": 3870.4,
|
|
"valid_targets_min": 670
|
|
},
|
|
{
|
|
"epoch": 4.636627906976744,
|
|
"grad_norm": 0.6583518666009744,
|
|
"learning_rate": 1.2369776789183234e-05,
|
|
"loss": 0.2417,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14675956964492798,
|
|
"step": 3190,
|
|
"valid_targets_mean": 3113.1,
|
|
"valid_targets_min": 677
|
|
},
|
|
{
|
|
"epoch": 4.6438953488372094,
|
|
"grad_norm": 0.4450353778257948,
|
|
"learning_rate": 1.230282253132849e-05,
|
|
"loss": 0.238,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11362966150045395,
|
|
"step": 3195,
|
|
"valid_targets_mean": 4771.6,
|
|
"valid_targets_min": 3887
|
|
},
|
|
{
|
|
"epoch": 4.651162790697675,
|
|
"grad_norm": 0.5094860056017274,
|
|
"learning_rate": 1.2235969383206987e-05,
|
|
"loss": 0.2459,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11538674682378769,
|
|
"step": 3200,
|
|
"valid_targets_mean": 3672.0,
|
|
"valid_targets_min": 509
|
|
},
|
|
{
|
|
"epoch": 4.658430232558139,
|
|
"grad_norm": 0.5084867559413941,
|
|
"learning_rate": 1.2169218222998294e-05,
|
|
"loss": 0.2293,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10229187458753586,
|
|
"step": 3205,
|
|
"valid_targets_mean": 3424.5,
|
|
"valid_targets_min": 755
|
|
},
|
|
{
|
|
"epoch": 4.665697674418604,
|
|
"grad_norm": 0.5637648552818592,
|
|
"learning_rate": 1.2102569927542275e-05,
|
|
"loss": 0.237,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12403546273708344,
|
|
"step": 3210,
|
|
"valid_targets_mean": 4107.8,
|
|
"valid_targets_min": 702
|
|
},
|
|
{
|
|
"epoch": 4.6729651162790695,
|
|
"grad_norm": 0.4948101308113288,
|
|
"learning_rate": 1.2036025372327553e-05,
|
|
"loss": 0.2292,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12994790077209473,
|
|
"step": 3215,
|
|
"valid_targets_mean": 3731.0,
|
|
"valid_targets_min": 547
|
|
},
|
|
{
|
|
"epoch": 4.680232558139535,
|
|
"grad_norm": 0.5394534093008194,
|
|
"learning_rate": 1.1969585431480037e-05,
|
|
"loss": 0.2418,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10351639986038208,
|
|
"step": 3220,
|
|
"valid_targets_mean": 3190.5,
|
|
"valid_targets_min": 689
|
|
},
|
|
{
|
|
"epoch": 4.6875,
|
|
"grad_norm": 0.4404560213423327,
|
|
"learning_rate": 1.1903250977751429e-05,
|
|
"loss": 0.2291,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09289942681789398,
|
|
"step": 3225,
|
|
"valid_targets_mean": 3678.2,
|
|
"valid_targets_min": 708
|
|
},
|
|
{
|
|
"epoch": 4.694767441860465,
|
|
"grad_norm": 0.5081100321617489,
|
|
"learning_rate": 1.1837022882507745e-05,
|
|
"loss": 0.2325,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12247206270694733,
|
|
"step": 3230,
|
|
"valid_targets_mean": 4082.9,
|
|
"valid_targets_min": 690
|
|
},
|
|
{
|
|
"epoch": 4.7020348837209305,
|
|
"grad_norm": 0.4441735432541099,
|
|
"learning_rate": 1.1770902015717894e-05,
|
|
"loss": 0.2303,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09333371371030807,
|
|
"step": 3235,
|
|
"valid_targets_mean": 3859.1,
|
|
"valid_targets_min": 614
|
|
},
|
|
{
|
|
"epoch": 4.709302325581396,
|
|
"grad_norm": 0.6011417337828853,
|
|
"learning_rate": 1.1704889245942229e-05,
|
|
"loss": 0.2349,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10990115255117416,
|
|
"step": 3240,
|
|
"valid_targets_mean": 2285.1,
|
|
"valid_targets_min": 522
|
|
},
|
|
{
|
|
"epoch": 4.716569767441861,
|
|
"grad_norm": 0.5021507632398494,
|
|
"learning_rate": 1.163898544032115e-05,
|
|
"loss": 0.2286,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11612962186336517,
|
|
"step": 3245,
|
|
"valid_targets_mean": 3578.5,
|
|
"valid_targets_min": 776
|
|
},
|
|
{
|
|
"epoch": 4.723837209302325,
|
|
"grad_norm": 0.5880169464524365,
|
|
"learning_rate": 1.1573191464563709e-05,
|
|
"loss": 0.2372,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09853021800518036,
|
|
"step": 3250,
|
|
"valid_targets_mean": 2618.2,
|
|
"valid_targets_min": 677
|
|
},
|
|
{
|
|
"epoch": 4.7311046511627906,
|
|
"grad_norm": 0.48959783668226775,
|
|
"learning_rate": 1.1507508182936231e-05,
|
|
"loss": 0.242,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09494741261005402,
|
|
"step": 3255,
|
|
"valid_targets_mean": 3397.2,
|
|
"valid_targets_min": 698
|
|
},
|
|
{
|
|
"epoch": 4.738372093023256,
|
|
"grad_norm": 0.46056950109789613,
|
|
"learning_rate": 1.144193645825099e-05,
|
|
"loss": 0.2338,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12248848378658295,
|
|
"step": 3260,
|
|
"valid_targets_mean": 4731.5,
|
|
"valid_targets_min": 507
|
|
},
|
|
{
|
|
"epoch": 4.745639534883721,
|
|
"grad_norm": 0.5214044669092526,
|
|
"learning_rate": 1.1376477151854832e-05,
|
|
"loss": 0.2282,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11522860825061798,
|
|
"step": 3265,
|
|
"valid_targets_mean": 3560.9,
|
|
"valid_targets_min": 566
|
|
},
|
|
{
|
|
"epoch": 4.752906976744186,
|
|
"grad_norm": 0.5820601949492391,
|
|
"learning_rate": 1.131113112361788e-05,
|
|
"loss": 0.2343,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12622776627540588,
|
|
"step": 3270,
|
|
"valid_targets_mean": 3919.5,
|
|
"valid_targets_min": 471
|
|
},
|
|
{
|
|
"epoch": 4.7601744186046515,
|
|
"grad_norm": 0.4664751855760365,
|
|
"learning_rate": 1.1245899231922265e-05,
|
|
"loss": 0.2296,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12376340478658676,
|
|
"step": 3275,
|
|
"valid_targets_mean": 4601.4,
|
|
"valid_targets_min": 469
|
|
},
|
|
{
|
|
"epoch": 4.767441860465116,
|
|
"grad_norm": 0.6667212632991735,
|
|
"learning_rate": 1.1180782333650807e-05,
|
|
"loss": 0.2324,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09619486331939697,
|
|
"step": 3280,
|
|
"valid_targets_mean": 1562.5,
|
|
"valid_targets_min": 581
|
|
},
|
|
{
|
|
"epoch": 4.774709302325581,
|
|
"grad_norm": 0.45412715795498276,
|
|
"learning_rate": 1.1115781284175777e-05,
|
|
"loss": 0.2345,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12009938806295395,
|
|
"step": 3285,
|
|
"valid_targets_mean": 4625.8,
|
|
"valid_targets_min": 849
|
|
},
|
|
{
|
|
"epoch": 4.781976744186046,
|
|
"grad_norm": 0.5704599440014428,
|
|
"learning_rate": 1.1050896937347666e-05,
|
|
"loss": 0.2495,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0995192751288414,
|
|
"step": 3290,
|
|
"valid_targets_mean": 2872.5,
|
|
"valid_targets_min": 602
|
|
},
|
|
{
|
|
"epoch": 4.789244186046512,
|
|
"grad_norm": 0.49543292260155836,
|
|
"learning_rate": 1.098613014548398e-05,
|
|
"loss": 0.2369,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11472610384225845,
|
|
"step": 3295,
|
|
"valid_targets_mean": 3716.9,
|
|
"valid_targets_min": 684
|
|
},
|
|
{
|
|
"epoch": 4.796511627906977,
|
|
"grad_norm": 0.537807694105439,
|
|
"learning_rate": 1.0921481759358005e-05,
|
|
"loss": 0.2396,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13546626269817352,
|
|
"step": 3300,
|
|
"valid_targets_mean": 4543.0,
|
|
"valid_targets_min": 571
|
|
},
|
|
{
|
|
"epoch": 4.803779069767442,
|
|
"grad_norm": 0.5678524865707387,
|
|
"learning_rate": 1.0856952628187662e-05,
|
|
"loss": 0.231,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.06101011484861374,
|
|
"step": 3305,
|
|
"valid_targets_mean": 1192.0,
|
|
"valid_targets_min": 412
|
|
},
|
|
{
|
|
"epoch": 4.811046511627907,
|
|
"grad_norm": 0.49246729295539404,
|
|
"learning_rate": 1.079254359962436e-05,
|
|
"loss": 0.2336,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09559541195631027,
|
|
"step": 3310,
|
|
"valid_targets_mean": 3340.8,
|
|
"valid_targets_min": 647
|
|
},
|
|
{
|
|
"epoch": 4.8183139534883725,
|
|
"grad_norm": 0.4743174571088282,
|
|
"learning_rate": 1.0728255519741831e-05,
|
|
"loss": 0.2372,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13542385399341583,
|
|
"step": 3315,
|
|
"valid_targets_mean": 4489.4,
|
|
"valid_targets_min": 791
|
|
},
|
|
{
|
|
"epoch": 4.825581395348837,
|
|
"grad_norm": 0.4984821091753099,
|
|
"learning_rate": 1.066408923302503e-05,
|
|
"loss": 0.2455,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11396318674087524,
|
|
"step": 3320,
|
|
"valid_targets_mean": 3852.9,
|
|
"valid_targets_min": 447
|
|
},
|
|
{
|
|
"epoch": 4.832848837209302,
|
|
"grad_norm": 0.5098307423292979,
|
|
"learning_rate": 1.060004558235905e-05,
|
|
"loss": 0.2407,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12900030612945557,
|
|
"step": 3325,
|
|
"valid_targets_mean": 3694.8,
|
|
"valid_targets_min": 632
|
|
},
|
|
{
|
|
"epoch": 4.840116279069767,
|
|
"grad_norm": 0.47560010661218727,
|
|
"learning_rate": 1.0536125409018043e-05,
|
|
"loss": 0.2304,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10933175683021545,
|
|
"step": 3330,
|
|
"valid_targets_mean": 3970.6,
|
|
"valid_targets_min": 513
|
|
},
|
|
{
|
|
"epoch": 4.847383720930233,
|
|
"grad_norm": 0.47044486233428945,
|
|
"learning_rate": 1.0472329552654172e-05,
|
|
"loss": 0.2293,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11043363064527512,
|
|
"step": 3335,
|
|
"valid_targets_mean": 3795.6,
|
|
"valid_targets_min": 578
|
|
},
|
|
{
|
|
"epoch": 4.854651162790698,
|
|
"grad_norm": 0.5639925542779571,
|
|
"learning_rate": 1.040865885128656e-05,
|
|
"loss": 0.2346,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10802865028381348,
|
|
"step": 3340,
|
|
"valid_targets_mean": 3206.9,
|
|
"valid_targets_min": 564
|
|
},
|
|
{
|
|
"epoch": 4.861918604651163,
|
|
"grad_norm": 0.446505868059933,
|
|
"learning_rate": 1.034511414129033e-05,
|
|
"loss": 0.253,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13078966736793518,
|
|
"step": 3345,
|
|
"valid_targets_mean": 5018.2,
|
|
"valid_targets_min": 652
|
|
},
|
|
{
|
|
"epoch": 4.8691860465116275,
|
|
"grad_norm": 0.5184499276874123,
|
|
"learning_rate": 1.0281696257385566e-05,
|
|
"loss": 0.2369,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12428499758243561,
|
|
"step": 3350,
|
|
"valid_targets_mean": 3502.9,
|
|
"valid_targets_min": 690
|
|
},
|
|
{
|
|
"epoch": 4.876453488372093,
|
|
"grad_norm": 0.5018714295797971,
|
|
"learning_rate": 1.0218406032626383e-05,
|
|
"loss": 0.2243,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10743530094623566,
|
|
"step": 3355,
|
|
"valid_targets_mean": 3596.0,
|
|
"valid_targets_min": 731
|
|
},
|
|
{
|
|
"epoch": 4.883720930232558,
|
|
"grad_norm": 0.5735331401509087,
|
|
"learning_rate": 1.015524429838995e-05,
|
|
"loss": 0.2348,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10622027516365051,
|
|
"step": 3360,
|
|
"valid_targets_mean": 2885.0,
|
|
"valid_targets_min": 605
|
|
},
|
|
{
|
|
"epoch": 4.890988372093023,
|
|
"grad_norm": 0.4840757316363492,
|
|
"learning_rate": 1.009221188436563e-05,
|
|
"loss": 0.2313,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1269492208957672,
|
|
"step": 3365,
|
|
"valid_targets_mean": 4277.8,
|
|
"valid_targets_min": 784
|
|
},
|
|
{
|
|
"epoch": 4.898255813953488,
|
|
"grad_norm": 0.49774705420226517,
|
|
"learning_rate": 1.0029309618544008e-05,
|
|
"loss": 0.2366,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13551053404808044,
|
|
"step": 3370,
|
|
"valid_targets_mean": 4511.5,
|
|
"valid_targets_min": 690
|
|
},
|
|
{
|
|
"epoch": 4.905523255813954,
|
|
"grad_norm": 0.6044199194468696,
|
|
"learning_rate": 9.966538327206055e-06,
|
|
"loss": 0.2414,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10581943392753601,
|
|
"step": 3375,
|
|
"valid_targets_mean": 2411.6,
|
|
"valid_targets_min": 507
|
|
},
|
|
{
|
|
"epoch": 4.912790697674419,
|
|
"grad_norm": 0.5239169019089047,
|
|
"learning_rate": 9.903898834912288e-06,
|
|
"loss": 0.2358,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12706102430820465,
|
|
"step": 3380,
|
|
"valid_targets_mean": 4133.9,
|
|
"valid_targets_min": 603
|
|
},
|
|
{
|
|
"epoch": 4.920058139534884,
|
|
"grad_norm": 0.6359657440783766,
|
|
"learning_rate": 9.8413919644919e-06,
|
|
"loss": 0.2605,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13760952651500702,
|
|
"step": 3385,
|
|
"valid_targets_mean": 3341.1,
|
|
"valid_targets_min": 579
|
|
},
|
|
{
|
|
"epoch": 4.9273255813953485,
|
|
"grad_norm": 0.526652947386687,
|
|
"learning_rate": 9.77901853703197e-06,
|
|
"loss": 0.2464,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12862738966941833,
|
|
"step": 3390,
|
|
"valid_targets_mean": 3435.9,
|
|
"valid_targets_min": 446
|
|
},
|
|
{
|
|
"epoch": 4.934593023255814,
|
|
"grad_norm": 0.5209569537688338,
|
|
"learning_rate": 9.716779371866674e-06,
|
|
"loss": 0.2372,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12216047942638397,
|
|
"step": 3395,
|
|
"valid_targets_mean": 3661.0,
|
|
"valid_targets_min": 641
|
|
},
|
|
{
|
|
"epoch": 4.941860465116279,
|
|
"grad_norm": 0.4874489939699638,
|
|
"learning_rate": 9.654675286566548e-06,
|
|
"loss": 0.2347,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09232984483242035,
|
|
"step": 3400,
|
|
"valid_targets_mean": 3675.9,
|
|
"valid_targets_min": 702
|
|
},
|
|
{
|
|
"epoch": 4.949127906976744,
|
|
"grad_norm": 0.5282339564188945,
|
|
"learning_rate": 9.592707096927704e-06,
|
|
"loss": 0.2219,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16324245929718018,
|
|
"step": 3405,
|
|
"valid_targets_mean": 4671.8,
|
|
"valid_targets_min": 398
|
|
},
|
|
{
|
|
"epoch": 4.9563953488372094,
|
|
"grad_norm": 0.522763578277042,
|
|
"learning_rate": 9.53087561696113e-06,
|
|
"loss": 0.2336,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10933259129524231,
|
|
"step": 3410,
|
|
"valid_targets_mean": 3505.0,
|
|
"valid_targets_min": 914
|
|
},
|
|
{
|
|
"epoch": 4.963662790697675,
|
|
"grad_norm": 0.5013393924009135,
|
|
"learning_rate": 9.469181658882034e-06,
|
|
"loss": 0.2459,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10687707364559174,
|
|
"step": 3415,
|
|
"valid_targets_mean": 3193.2,
|
|
"valid_targets_min": 802
|
|
},
|
|
{
|
|
"epoch": 4.970930232558139,
|
|
"grad_norm": 0.4813101013967105,
|
|
"learning_rate": 9.40762603309911e-06,
|
|
"loss": 0.238,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08028747141361237,
|
|
"step": 3420,
|
|
"valid_targets_mean": 2682.6,
|
|
"valid_targets_min": 430
|
|
},
|
|
{
|
|
"epoch": 4.978197674418604,
|
|
"grad_norm": 0.5220023231881794,
|
|
"learning_rate": 9.346209548203947e-06,
|
|
"loss": 0.2319,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13090111315250397,
|
|
"step": 3425,
|
|
"valid_targets_mean": 5490.4,
|
|
"valid_targets_min": 4037
|
|
},
|
|
{
|
|
"epoch": 4.9854651162790695,
|
|
"grad_norm": 0.47855880716995414,
|
|
"learning_rate": 9.284933010960364e-06,
|
|
"loss": 0.2512,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1151789128780365,
|
|
"step": 3430,
|
|
"valid_targets_mean": 4014.4,
|
|
"valid_targets_min": 735
|
|
},
|
|
{
|
|
"epoch": 4.992732558139535,
|
|
"grad_norm": 0.5519432983605355,
|
|
"learning_rate": 9.223797226293867e-06,
|
|
"loss": 0.231,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11323521286249161,
|
|
"step": 3435,
|
|
"valid_targets_mean": 3503.9,
|
|
"valid_targets_min": 667
|
|
},
|
|
{
|
|
"epoch": 5.0,
|
|
"grad_norm": 0.5180141428234212,
|
|
"learning_rate": 9.162802997281022e-06,
|
|
"loss": 0.2371,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14478221535682678,
|
|
"step": 3440,
|
|
"valid_targets_mean": 3696.8,
|
|
"valid_targets_min": 759
|
|
},
|
|
{
|
|
"epoch": 5.007267441860465,
|
|
"grad_norm": 0.5064465775517101,
|
|
"learning_rate": 9.10195112513892e-06,
|
|
"loss": 0.2274,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11103392392396927,
|
|
"step": 3445,
|
|
"valid_targets_mean": 3689.1,
|
|
"valid_targets_min": 527
|
|
},
|
|
{
|
|
"epoch": 5.0145348837209305,
|
|
"grad_norm": 0.5163608827235715,
|
|
"learning_rate": 9.041242409214686e-06,
|
|
"loss": 0.219,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10698623955249786,
|
|
"step": 3450,
|
|
"valid_targets_mean": 3850.9,
|
|
"valid_targets_min": 732
|
|
},
|
|
{
|
|
"epoch": 5.021802325581396,
|
|
"grad_norm": 0.5841669567924161,
|
|
"learning_rate": 8.980677646974926e-06,
|
|
"loss": 0.2222,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.16529354453086853,
|
|
"step": 3455,
|
|
"valid_targets_mean": 4314.1,
|
|
"valid_targets_min": 636
|
|
},
|
|
{
|
|
"epoch": 5.02906976744186,
|
|
"grad_norm": 0.5776954665741999,
|
|
"learning_rate": 8.920257633995295e-06,
|
|
"loss": 0.2215,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12802791595458984,
|
|
"step": 3460,
|
|
"valid_targets_mean": 3402.9,
|
|
"valid_targets_min": 704
|
|
},
|
|
{
|
|
"epoch": 5.036337209302325,
|
|
"grad_norm": 0.5039901178948153,
|
|
"learning_rate": 8.85998316395001e-06,
|
|
"loss": 0.2304,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12501442432403564,
|
|
"step": 3465,
|
|
"valid_targets_mean": 4067.0,
|
|
"valid_targets_min": 806
|
|
},
|
|
{
|
|
"epoch": 5.0436046511627906,
|
|
"grad_norm": 0.5973873035633013,
|
|
"learning_rate": 8.799855028601472e-06,
|
|
"loss": 0.2313,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12955757975578308,
|
|
"step": 3470,
|
|
"valid_targets_mean": 3599.6,
|
|
"valid_targets_min": 621
|
|
},
|
|
{
|
|
"epoch": 5.050872093023256,
|
|
"grad_norm": 0.5425804505001001,
|
|
"learning_rate": 8.739874017789813e-06,
|
|
"loss": 0.223,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10548754036426544,
|
|
"step": 3475,
|
|
"valid_targets_mean": 2965.9,
|
|
"valid_targets_min": 238
|
|
},
|
|
{
|
|
"epoch": 5.058139534883721,
|
|
"grad_norm": 0.5200649497723702,
|
|
"learning_rate": 8.680040919422544e-06,
|
|
"loss": 0.2288,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13549460470676422,
|
|
"step": 3480,
|
|
"valid_targets_mean": 4974.2,
|
|
"valid_targets_min": 3582
|
|
},
|
|
{
|
|
"epoch": 5.065406976744186,
|
|
"grad_norm": 0.5864066094152384,
|
|
"learning_rate": 8.620356519464228e-06,
|
|
"loss": 0.2262,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12549281120300293,
|
|
"step": 3485,
|
|
"valid_targets_mean": 4444.4,
|
|
"valid_targets_min": 672
|
|
},
|
|
{
|
|
"epoch": 5.0726744186046515,
|
|
"grad_norm": 0.5523220644419992,
|
|
"learning_rate": 8.560821601926112e-06,
|
|
"loss": 0.2416,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11209696531295776,
|
|
"step": 3490,
|
|
"valid_targets_mean": 3835.5,
|
|
"valid_targets_min": 582
|
|
},
|
|
{
|
|
"epoch": 5.079941860465116,
|
|
"grad_norm": 0.5657939357844483,
|
|
"learning_rate": 8.501436948855857e-06,
|
|
"loss": 0.2155,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10303827375173569,
|
|
"step": 3495,
|
|
"valid_targets_mean": 3019.0,
|
|
"valid_targets_min": 773
|
|
},
|
|
{
|
|
"epoch": 5.087209302325581,
|
|
"grad_norm": 0.5147529737841077,
|
|
"learning_rate": 8.44220334032725e-06,
|
|
"loss": 0.2137,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11031322181224823,
|
|
"step": 3500,
|
|
"valid_targets_mean": 3997.8,
|
|
"valid_targets_min": 542
|
|
},
|
|
{
|
|
"epoch": 5.094476744186046,
|
|
"grad_norm": 0.462171392787495,
|
|
"learning_rate": 8.383121554429985e-06,
|
|
"loss": 0.2239,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09460602700710297,
|
|
"step": 3505,
|
|
"valid_targets_mean": 3166.2,
|
|
"valid_targets_min": 603
|
|
},
|
|
{
|
|
"epoch": 5.101744186046512,
|
|
"grad_norm": 0.5004999228518526,
|
|
"learning_rate": 8.3241923672594e-06,
|
|
"loss": 0.222,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11931440234184265,
|
|
"step": 3510,
|
|
"valid_targets_mean": 4244.2,
|
|
"valid_targets_min": 740
|
|
},
|
|
{
|
|
"epoch": 5.109011627906977,
|
|
"grad_norm": 0.5405328149776527,
|
|
"learning_rate": 8.265416552906316e-06,
|
|
"loss": 0.2308,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12601076066493988,
|
|
"step": 3515,
|
|
"valid_targets_mean": 4365.4,
|
|
"valid_targets_min": 759
|
|
},
|
|
{
|
|
"epoch": 5.116279069767442,
|
|
"grad_norm": 0.5425947774119614,
|
|
"learning_rate": 8.20679488344684e-06,
|
|
"loss": 0.2181,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10105065256357193,
|
|
"step": 3520,
|
|
"valid_targets_mean": 3867.1,
|
|
"valid_targets_min": 623
|
|
},
|
|
{
|
|
"epoch": 5.123546511627907,
|
|
"grad_norm": 0.4766640353998748,
|
|
"learning_rate": 8.148328128932263e-06,
|
|
"loss": 0.2286,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10325950384140015,
|
|
"step": 3525,
|
|
"valid_targets_mean": 3969.1,
|
|
"valid_targets_min": 821
|
|
},
|
|
{
|
|
"epoch": 5.1308139534883725,
|
|
"grad_norm": 0.5279713250696507,
|
|
"learning_rate": 8.090017057378913e-06,
|
|
"loss": 0.2332,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10024862736463547,
|
|
"step": 3530,
|
|
"valid_targets_mean": 4346.2,
|
|
"valid_targets_min": 767
|
|
},
|
|
{
|
|
"epoch": 5.138081395348837,
|
|
"grad_norm": 0.6487999870575004,
|
|
"learning_rate": 8.03186243475807e-06,
|
|
"loss": 0.2325,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14460906386375427,
|
|
"step": 3535,
|
|
"valid_targets_mean": 3415.9,
|
|
"valid_targets_min": 773
|
|
},
|
|
{
|
|
"epoch": 5.145348837209302,
|
|
"grad_norm": 0.5270915274072561,
|
|
"learning_rate": 7.9738650249859e-06,
|
|
"loss": 0.2221,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11179886013269424,
|
|
"step": 3540,
|
|
"valid_targets_mean": 3993.8,
|
|
"valid_targets_min": 624
|
|
},
|
|
{
|
|
"epoch": 5.152616279069767,
|
|
"grad_norm": 0.5287461236460308,
|
|
"learning_rate": 7.916025589913452e-06,
|
|
"loss": 0.2243,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11516192555427551,
|
|
"step": 3545,
|
|
"valid_targets_mean": 3947.0,
|
|
"valid_targets_min": 742
|
|
},
|
|
{
|
|
"epoch": 5.159883720930233,
|
|
"grad_norm": 0.5450827809641174,
|
|
"learning_rate": 7.858344889316611e-06,
|
|
"loss": 0.2212,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11309966444969177,
|
|
"step": 3550,
|
|
"valid_targets_mean": 3872.1,
|
|
"valid_targets_min": 605
|
|
},
|
|
{
|
|
"epoch": 5.167151162790698,
|
|
"grad_norm": 0.4721896964111328,
|
|
"learning_rate": 7.80082368088613e-06,
|
|
"loss": 0.224,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1209426149725914,
|
|
"step": 3555,
|
|
"valid_targets_mean": 5368.0,
|
|
"valid_targets_min": 4502
|
|
},
|
|
{
|
|
"epoch": 5.174418604651163,
|
|
"grad_norm": 0.5628603862929638,
|
|
"learning_rate": 7.743462720217698e-06,
|
|
"loss": 0.2348,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09959325939416885,
|
|
"step": 3560,
|
|
"valid_targets_mean": 3553.9,
|
|
"valid_targets_min": 842
|
|
},
|
|
{
|
|
"epoch": 5.1816860465116275,
|
|
"grad_norm": 0.5071148846714348,
|
|
"learning_rate": 7.686262760801985e-06,
|
|
"loss": 0.2211,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13151785731315613,
|
|
"step": 3565,
|
|
"valid_targets_mean": 4163.6,
|
|
"valid_targets_min": 1394
|
|
},
|
|
{
|
|
"epoch": 5.188953488372093,
|
|
"grad_norm": 0.5170664010112574,
|
|
"learning_rate": 7.629224554014763e-06,
|
|
"loss": 0.231,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11399704217910767,
|
|
"step": 3570,
|
|
"valid_targets_mean": 3945.2,
|
|
"valid_targets_min": 735
|
|
},
|
|
{
|
|
"epoch": 5.196220930232558,
|
|
"grad_norm": 0.5006143865508161,
|
|
"learning_rate": 7.5723488491070116e-06,
|
|
"loss": 0.2208,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11205872893333435,
|
|
"step": 3575,
|
|
"valid_targets_mean": 4519.0,
|
|
"valid_targets_min": 625
|
|
},
|
|
{
|
|
"epoch": 5.203488372093023,
|
|
"grad_norm": 0.6146302140772092,
|
|
"learning_rate": 7.515636393195129e-06,
|
|
"loss": 0.2126,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10611201822757721,
|
|
"step": 3580,
|
|
"valid_targets_mean": 2733.1,
|
|
"valid_targets_min": 629
|
|
},
|
|
{
|
|
"epoch": 5.210755813953488,
|
|
"grad_norm": 0.5416120670446422,
|
|
"learning_rate": 7.459087931251052e-06,
|
|
"loss": 0.2276,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08908810466527939,
|
|
"step": 3585,
|
|
"valid_targets_mean": 3024.0,
|
|
"valid_targets_min": 780
|
|
},
|
|
{
|
|
"epoch": 5.218023255813954,
|
|
"grad_norm": 0.6388381534227345,
|
|
"learning_rate": 7.402704206092508e-06,
|
|
"loss": 0.2144,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09935657680034637,
|
|
"step": 3590,
|
|
"valid_targets_mean": 2290.0,
|
|
"valid_targets_min": 740
|
|
},
|
|
{
|
|
"epoch": 5.225290697674419,
|
|
"grad_norm": 0.5758476899160144,
|
|
"learning_rate": 7.346485958373266e-06,
|
|
"loss": 0.2218,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11001452803611755,
|
|
"step": 3595,
|
|
"valid_targets_mean": 3376.2,
|
|
"valid_targets_min": 516
|
|
},
|
|
{
|
|
"epoch": 5.232558139534884,
|
|
"grad_norm": 0.5940721029348974,
|
|
"learning_rate": 7.290433926573373e-06,
|
|
"loss": 0.2369,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11747955530881882,
|
|
"step": 3600,
|
|
"valid_targets_mean": 2742.5,
|
|
"valid_targets_min": 774
|
|
},
|
|
{
|
|
"epoch": 5.2398255813953485,
|
|
"grad_norm": 0.7197251133332507,
|
|
"learning_rate": 7.234548846989478e-06,
|
|
"loss": 0.2232,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09308021515607834,
|
|
"step": 3605,
|
|
"valid_targets_mean": 2550.1,
|
|
"valid_targets_min": 467
|
|
},
|
|
{
|
|
"epoch": 5.247093023255814,
|
|
"grad_norm": 0.5111088589057889,
|
|
"learning_rate": 7.17883145372515e-06,
|
|
"loss": 0.2318,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1333235502243042,
|
|
"step": 3610,
|
|
"valid_targets_mean": 4213.5,
|
|
"valid_targets_min": 628
|
|
},
|
|
{
|
|
"epoch": 5.254360465116279,
|
|
"grad_norm": 0.5399044782488424,
|
|
"learning_rate": 7.123282478681255e-06,
|
|
"loss": 0.2341,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12484262883663177,
|
|
"step": 3615,
|
|
"valid_targets_mean": 3860.6,
|
|
"valid_targets_min": 982
|
|
},
|
|
{
|
|
"epoch": 5.261627906976744,
|
|
"grad_norm": 0.6089362087155372,
|
|
"learning_rate": 7.06790265154631e-06,
|
|
"loss": 0.2314,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09410004317760468,
|
|
"step": 3620,
|
|
"valid_targets_mean": 2744.4,
|
|
"valid_targets_min": 727
|
|
},
|
|
{
|
|
"epoch": 5.2688953488372094,
|
|
"grad_norm": 0.4993540684053602,
|
|
"learning_rate": 7.012692699786918e-06,
|
|
"loss": 0.211,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12370635569095612,
|
|
"step": 3625,
|
|
"valid_targets_mean": 4632.6,
|
|
"valid_targets_min": 716
|
|
},
|
|
{
|
|
"epoch": 5.276162790697675,
|
|
"grad_norm": 0.5038961889630662,
|
|
"learning_rate": 6.9576533486382004e-06,
|
|
"loss": 0.233,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11674419045448303,
|
|
"step": 3630,
|
|
"valid_targets_mean": 4505.5,
|
|
"valid_targets_min": 942
|
|
},
|
|
{
|
|
"epoch": 5.28343023255814,
|
|
"grad_norm": 0.46578591540410913,
|
|
"learning_rate": 6.902785321094301e-06,
|
|
"loss": 0.2186,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09898681193590164,
|
|
"step": 3635,
|
|
"valid_targets_mean": 4460.9,
|
|
"valid_targets_min": 301
|
|
},
|
|
{
|
|
"epoch": 5.290697674418604,
|
|
"grad_norm": 0.5426836571471386,
|
|
"learning_rate": 6.84808933789884e-06,
|
|
"loss": 0.2314,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11427856236696243,
|
|
"step": 3640,
|
|
"valid_targets_mean": 4147.2,
|
|
"valid_targets_min": 660
|
|
},
|
|
{
|
|
"epoch": 5.2979651162790695,
|
|
"grad_norm": 0.5289085011659265,
|
|
"learning_rate": 6.793566117535475e-06,
|
|
"loss": 0.2234,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1171591728925705,
|
|
"step": 3645,
|
|
"valid_targets_mean": 3967.5,
|
|
"valid_targets_min": 832
|
|
},
|
|
{
|
|
"epoch": 5.305232558139535,
|
|
"grad_norm": 0.5842762111741557,
|
|
"learning_rate": 6.739216376218483e-06,
|
|
"loss": 0.2258,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1301005482673645,
|
|
"step": 3650,
|
|
"valid_targets_mean": 3883.5,
|
|
"valid_targets_min": 717
|
|
},
|
|
{
|
|
"epoch": 5.3125,
|
|
"grad_norm": 0.5229828592303515,
|
|
"learning_rate": 6.6850408278833e-06,
|
|
"loss": 0.2309,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10519362986087799,
|
|
"step": 3655,
|
|
"valid_targets_mean": 3604.9,
|
|
"valid_targets_min": 914
|
|
},
|
|
{
|
|
"epoch": 5.319767441860465,
|
|
"grad_norm": 0.5537040247119486,
|
|
"learning_rate": 6.631040184177191e-06,
|
|
"loss": 0.2197,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1311875283718109,
|
|
"step": 3660,
|
|
"valid_targets_mean": 3819.0,
|
|
"valid_targets_min": 508
|
|
},
|
|
{
|
|
"epoch": 5.3270348837209305,
|
|
"grad_norm": 0.5061352169459574,
|
|
"learning_rate": 6.577215154449863e-06,
|
|
"loss": 0.2209,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09532980620861053,
|
|
"step": 3665,
|
|
"valid_targets_mean": 3654.8,
|
|
"valid_targets_min": 729
|
|
},
|
|
{
|
|
"epoch": 5.334302325581396,
|
|
"grad_norm": 0.45550595784330383,
|
|
"learning_rate": 6.523566445744196e-06,
|
|
"loss": 0.2327,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09947185218334198,
|
|
"step": 3670,
|
|
"valid_targets_mean": 4620.1,
|
|
"valid_targets_min": 801
|
|
},
|
|
{
|
|
"epoch": 5.34156976744186,
|
|
"grad_norm": 0.5885273568890355,
|
|
"learning_rate": 6.470094762786901e-06,
|
|
"loss": 0.2177,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12775710225105286,
|
|
"step": 3675,
|
|
"valid_targets_mean": 3814.5,
|
|
"valid_targets_min": 792
|
|
},
|
|
{
|
|
"epoch": 5.348837209302325,
|
|
"grad_norm": 0.5972530769456403,
|
|
"learning_rate": 6.4168008079792906e-06,
|
|
"loss": 0.2245,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08653900772333145,
|
|
"step": 3680,
|
|
"valid_targets_mean": 2589.9,
|
|
"valid_targets_min": 509
|
|
},
|
|
{
|
|
"epoch": 5.3561046511627906,
|
|
"grad_norm": 0.489387591827279,
|
|
"learning_rate": 6.36368528138807e-06,
|
|
"loss": 0.2243,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.130646213889122,
|
|
"step": 3685,
|
|
"valid_targets_mean": 4938.5,
|
|
"valid_targets_min": 984
|
|
},
|
|
{
|
|
"epoch": 5.363372093023256,
|
|
"grad_norm": 0.6170411592431482,
|
|
"learning_rate": 6.310748880736095e-06,
|
|
"loss": 0.2267,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09561936557292938,
|
|
"step": 3690,
|
|
"valid_targets_mean": 3151.4,
|
|
"valid_targets_min": 638
|
|
},
|
|
{
|
|
"epoch": 5.370639534883721,
|
|
"grad_norm": 0.5081130790237884,
|
|
"learning_rate": 6.2579923013932435e-06,
|
|
"loss": 0.2228,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1221495121717453,
|
|
"step": 3695,
|
|
"valid_targets_mean": 4372.9,
|
|
"valid_targets_min": 943
|
|
},
|
|
{
|
|
"epoch": 5.377906976744186,
|
|
"grad_norm": 0.6454509271848846,
|
|
"learning_rate": 6.205416236367263e-06,
|
|
"loss": 0.2313,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09919290244579315,
|
|
"step": 3700,
|
|
"valid_targets_mean": 2139.8,
|
|
"valid_targets_min": 495
|
|
},
|
|
{
|
|
"epoch": 5.3851744186046515,
|
|
"grad_norm": 0.557518677664274,
|
|
"learning_rate": 6.1530213762946944e-06,
|
|
"loss": 0.2281,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1259082555770874,
|
|
"step": 3705,
|
|
"valid_targets_mean": 4007.5,
|
|
"valid_targets_min": 745
|
|
},
|
|
{
|
|
"epoch": 5.392441860465116,
|
|
"grad_norm": 0.5793527159329909,
|
|
"learning_rate": 6.100808409431755e-06,
|
|
"loss": 0.2274,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12197981774806976,
|
|
"step": 3710,
|
|
"valid_targets_mean": 3392.2,
|
|
"valid_targets_min": 563
|
|
},
|
|
{
|
|
"epoch": 5.399709302325581,
|
|
"grad_norm": 0.5386985816616846,
|
|
"learning_rate": 6.048778021645329e-06,
|
|
"loss": 0.2131,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10789743065834045,
|
|
"step": 3715,
|
|
"valid_targets_mean": 3452.0,
|
|
"valid_targets_min": 612
|
|
},
|
|
{
|
|
"epoch": 5.406976744186046,
|
|
"grad_norm": 0.621910014250417,
|
|
"learning_rate": 5.996930896403967e-06,
|
|
"loss": 0.2309,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1227702647447586,
|
|
"step": 3720,
|
|
"valid_targets_mean": 3322.1,
|
|
"valid_targets_min": 790
|
|
},
|
|
{
|
|
"epoch": 5.414244186046512,
|
|
"grad_norm": 0.5057315708259351,
|
|
"learning_rate": 5.94526771476887e-06,
|
|
"loss": 0.2224,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10889577120542526,
|
|
"step": 3725,
|
|
"valid_targets_mean": 4153.8,
|
|
"valid_targets_min": 772
|
|
},
|
|
{
|
|
"epoch": 5.421511627906977,
|
|
"grad_norm": 0.5308377606082096,
|
|
"learning_rate": 5.893789155384975e-06,
|
|
"loss": 0.2227,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09790430963039398,
|
|
"step": 3730,
|
|
"valid_targets_mean": 3238.1,
|
|
"valid_targets_min": 778
|
|
},
|
|
{
|
|
"epoch": 5.428779069767442,
|
|
"grad_norm": 0.47748576601578613,
|
|
"learning_rate": 5.8424958944720245e-06,
|
|
"loss": 0.2256,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1386643946170807,
|
|
"step": 3735,
|
|
"valid_targets_mean": 5128.6,
|
|
"valid_targets_min": 392
|
|
},
|
|
{
|
|
"epoch": 5.436046511627907,
|
|
"grad_norm": 0.5129310083697562,
|
|
"learning_rate": 5.791388605815709e-06,
|
|
"loss": 0.2315,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11397480964660645,
|
|
"step": 3740,
|
|
"valid_targets_mean": 4230.2,
|
|
"valid_targets_min": 589
|
|
},
|
|
{
|
|
"epoch": 5.4433139534883725,
|
|
"grad_norm": 0.586622641537686,
|
|
"learning_rate": 5.740467960758776e-06,
|
|
"loss": 0.2164,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13233549892902374,
|
|
"step": 3745,
|
|
"valid_targets_mean": 3652.4,
|
|
"valid_targets_min": 737
|
|
},
|
|
{
|
|
"epoch": 5.450581395348837,
|
|
"grad_norm": 0.47656954097512755,
|
|
"learning_rate": 5.68973462819223e-06,
|
|
"loss": 0.2222,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08915632963180542,
|
|
"step": 3750,
|
|
"valid_targets_mean": 4145.4,
|
|
"valid_targets_min": 476
|
|
},
|
|
{
|
|
"epoch": 5.457848837209302,
|
|
"grad_norm": 0.47752527551101914,
|
|
"learning_rate": 5.63918927454657e-06,
|
|
"loss": 0.2219,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08590822666883469,
|
|
"step": 3755,
|
|
"valid_targets_mean": 3623.9,
|
|
"valid_targets_min": 534
|
|
},
|
|
{
|
|
"epoch": 5.465116279069767,
|
|
"grad_norm": 0.6775039949217503,
|
|
"learning_rate": 5.588832563783e-06,
|
|
"loss": 0.2212,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10755671560764313,
|
|
"step": 3760,
|
|
"valid_targets_mean": 1813.9,
|
|
"valid_targets_min": 601
|
|
},
|
|
{
|
|
"epoch": 5.472383720930233,
|
|
"grad_norm": 0.4616676959594202,
|
|
"learning_rate": 5.538665157384715e-06,
|
|
"loss": 0.2249,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11233869940042496,
|
|
"step": 3765,
|
|
"valid_targets_mean": 4682.6,
|
|
"valid_targets_min": 3531
|
|
},
|
|
{
|
|
"epoch": 5.479651162790698,
|
|
"grad_norm": 0.5377360862025549,
|
|
"learning_rate": 5.48868771434822e-06,
|
|
"loss": 0.226,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1236083060503006,
|
|
"step": 3770,
|
|
"valid_targets_mean": 3839.6,
|
|
"valid_targets_min": 752
|
|
},
|
|
{
|
|
"epoch": 5.486918604651163,
|
|
"grad_norm": 0.6338269834891624,
|
|
"learning_rate": 5.438900891174686e-06,
|
|
"loss": 0.2369,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13257811963558197,
|
|
"step": 3775,
|
|
"valid_targets_mean": 3260.4,
|
|
"valid_targets_min": 417
|
|
},
|
|
{
|
|
"epoch": 5.4941860465116275,
|
|
"grad_norm": 0.5183978177248446,
|
|
"learning_rate": 5.389305341861293e-06,
|
|
"loss": 0.2369,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10330487787723541,
|
|
"step": 3780,
|
|
"valid_targets_mean": 3676.6,
|
|
"valid_targets_min": 622
|
|
},
|
|
{
|
|
"epoch": 5.501453488372093,
|
|
"grad_norm": 0.5006609696903801,
|
|
"learning_rate": 5.3399017178926614e-06,
|
|
"loss": 0.2198,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09554791450500488,
|
|
"step": 3785,
|
|
"valid_targets_mean": 3681.5,
|
|
"valid_targets_min": 503
|
|
},
|
|
{
|
|
"epoch": 5.508720930232558,
|
|
"grad_norm": 0.5369589728239931,
|
|
"learning_rate": 5.290690668232301e-06,
|
|
"loss": 0.2283,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12455598264932632,
|
|
"step": 3790,
|
|
"valid_targets_mean": 3967.4,
|
|
"valid_targets_min": 822
|
|
},
|
|
{
|
|
"epoch": 5.515988372093023,
|
|
"grad_norm": 0.5412191392066285,
|
|
"learning_rate": 5.2416728393140624e-06,
|
|
"loss": 0.2269,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11805573850870132,
|
|
"step": 3795,
|
|
"valid_targets_mean": 3910.9,
|
|
"valid_targets_min": 611
|
|
},
|
|
{
|
|
"epoch": 5.523255813953488,
|
|
"grad_norm": 0.5237261735625945,
|
|
"learning_rate": 5.192848875033663e-06,
|
|
"loss": 0.2257,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11130371689796448,
|
|
"step": 3800,
|
|
"valid_targets_mean": 3325.5,
|
|
"valid_targets_min": 525
|
|
},
|
|
{
|
|
"epoch": 5.530523255813954,
|
|
"grad_norm": 0.4855369276832591,
|
|
"learning_rate": 5.144219416740217e-06,
|
|
"loss": 0.238,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1295335739850998,
|
|
"step": 3805,
|
|
"valid_targets_mean": 4685.5,
|
|
"valid_targets_min": 916
|
|
},
|
|
{
|
|
"epoch": 5.537790697674419,
|
|
"grad_norm": 0.5357362667911629,
|
|
"learning_rate": 5.095785103227835e-06,
|
|
"loss": 0.222,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10563298314809799,
|
|
"step": 3810,
|
|
"valid_targets_mean": 3333.4,
|
|
"valid_targets_min": 459
|
|
},
|
|
{
|
|
"epoch": 5.545058139534884,
|
|
"grad_norm": 0.4783226797446443,
|
|
"learning_rate": 5.047546570727205e-06,
|
|
"loss": 0.2166,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08839955925941467,
|
|
"step": 3815,
|
|
"valid_targets_mean": 3058.4,
|
|
"valid_targets_min": 626
|
|
},
|
|
{
|
|
"epoch": 5.5523255813953485,
|
|
"grad_norm": 0.603397173592423,
|
|
"learning_rate": 4.999504452897232e-06,
|
|
"loss": 0.2208,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14669716358184814,
|
|
"step": 3820,
|
|
"valid_targets_mean": 3794.2,
|
|
"valid_targets_min": 880
|
|
},
|
|
{
|
|
"epoch": 5.559593023255814,
|
|
"grad_norm": 0.5498293837910059,
|
|
"learning_rate": 4.95165938081676e-06,
|
|
"loss": 0.2301,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15765151381492615,
|
|
"step": 3825,
|
|
"valid_targets_mean": 3928.4,
|
|
"valid_targets_min": 685
|
|
},
|
|
{
|
|
"epoch": 5.566860465116279,
|
|
"grad_norm": 0.5075169876722437,
|
|
"learning_rate": 4.9040119829762246e-06,
|
|
"loss": 0.2317,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12888945639133453,
|
|
"step": 3830,
|
|
"valid_targets_mean": 4282.1,
|
|
"valid_targets_min": 800
|
|
},
|
|
{
|
|
"epoch": 5.574127906976744,
|
|
"grad_norm": 0.553383225462878,
|
|
"learning_rate": 4.856562885269427e-06,
|
|
"loss": 0.2166,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10596640408039093,
|
|
"step": 3835,
|
|
"valid_targets_mean": 2909.5,
|
|
"valid_targets_min": 619
|
|
},
|
|
{
|
|
"epoch": 5.5813953488372094,
|
|
"grad_norm": 0.7686235169257939,
|
|
"learning_rate": 4.809312710985308e-06,
|
|
"loss": 0.2366,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.17210009694099426,
|
|
"step": 3840,
|
|
"valid_targets_mean": 2873.5,
|
|
"valid_targets_min": 484
|
|
},
|
|
{
|
|
"epoch": 5.588662790697675,
|
|
"grad_norm": 0.554861312349065,
|
|
"learning_rate": 4.762262080799771e-06,
|
|
"loss": 0.2396,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13465741276741028,
|
|
"step": 3845,
|
|
"valid_targets_mean": 4018.6,
|
|
"valid_targets_min": 735
|
|
},
|
|
{
|
|
"epoch": 5.595930232558139,
|
|
"grad_norm": 0.46848899820454354,
|
|
"learning_rate": 4.715411612767508e-06,
|
|
"loss": 0.2127,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11969712376594543,
|
|
"step": 3850,
|
|
"valid_targets_mean": 4644.1,
|
|
"valid_targets_min": 3761
|
|
},
|
|
{
|
|
"epoch": 5.603197674418604,
|
|
"grad_norm": 0.46405211577543315,
|
|
"learning_rate": 4.668761922313893e-06,
|
|
"loss": 0.2235,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09280385076999664,
|
|
"step": 3855,
|
|
"valid_targets_mean": 3501.6,
|
|
"valid_targets_min": 602
|
|
},
|
|
{
|
|
"epoch": 5.6104651162790695,
|
|
"grad_norm": 0.5308472326139155,
|
|
"learning_rate": 4.622313622226888e-06,
|
|
"loss": 0.2248,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0978182926774025,
|
|
"step": 3860,
|
|
"valid_targets_mean": 3168.2,
|
|
"valid_targets_min": 246
|
|
},
|
|
{
|
|
"epoch": 5.617732558139535,
|
|
"grad_norm": 0.5701733988373806,
|
|
"learning_rate": 4.5760673226490245e-06,
|
|
"loss": 0.2391,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09062608331441879,
|
|
"step": 3865,
|
|
"valid_targets_mean": 2962.1,
|
|
"valid_targets_min": 506
|
|
},
|
|
{
|
|
"epoch": 5.625,
|
|
"grad_norm": 0.5600910428886875,
|
|
"learning_rate": 4.530023631069342e-06,
|
|
"loss": 0.2326,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.112250916659832,
|
|
"step": 3870,
|
|
"valid_targets_mean": 3511.9,
|
|
"valid_targets_min": 781
|
|
},
|
|
{
|
|
"epoch": 5.632267441860465,
|
|
"grad_norm": 0.4847013463582278,
|
|
"learning_rate": 4.484183152315435e-06,
|
|
"loss": 0.2223,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.131978377699852,
|
|
"step": 3875,
|
|
"valid_targets_mean": 5273.6,
|
|
"valid_targets_min": 735
|
|
},
|
|
{
|
|
"epoch": 5.6395348837209305,
|
|
"grad_norm": 0.5504896810558689,
|
|
"learning_rate": 4.438546488545516e-06,
|
|
"loss": 0.2206,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08465667814016342,
|
|
"step": 3880,
|
|
"valid_targets_mean": 2705.5,
|
|
"valid_targets_min": 550
|
|
},
|
|
{
|
|
"epoch": 5.646802325581396,
|
|
"grad_norm": 0.4930889515925386,
|
|
"learning_rate": 4.393114239240495e-06,
|
|
"loss": 0.2206,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09775549173355103,
|
|
"step": 3885,
|
|
"valid_targets_mean": 3736.1,
|
|
"valid_targets_min": 486
|
|
},
|
|
{
|
|
"epoch": 5.654069767441861,
|
|
"grad_norm": 0.6661086629183974,
|
|
"learning_rate": 4.347887001196089e-06,
|
|
"loss": 0.2185,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13360783457756042,
|
|
"step": 3890,
|
|
"valid_targets_mean": 2850.1,
|
|
"valid_targets_min": 447
|
|
},
|
|
{
|
|
"epoch": 5.661337209302325,
|
|
"grad_norm": 0.49494538033843166,
|
|
"learning_rate": 4.302865368515002e-06,
|
|
"loss": 0.215,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11445395648479462,
|
|
"step": 3895,
|
|
"valid_targets_mean": 3998.5,
|
|
"valid_targets_min": 634
|
|
},
|
|
{
|
|
"epoch": 5.6686046511627906,
|
|
"grad_norm": 0.5172249268234121,
|
|
"learning_rate": 4.2580499325991284e-06,
|
|
"loss": 0.2277,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12026748061180115,
|
|
"step": 3900,
|
|
"valid_targets_mean": 4291.1,
|
|
"valid_targets_min": 1215
|
|
},
|
|
{
|
|
"epoch": 5.675872093023256,
|
|
"grad_norm": 0.584906298842366,
|
|
"learning_rate": 4.213441282141762e-06,
|
|
"loss": 0.2243,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10975706577301025,
|
|
"step": 3905,
|
|
"valid_targets_mean": 3372.2,
|
|
"valid_targets_min": 707
|
|
},
|
|
{
|
|
"epoch": 5.683139534883721,
|
|
"grad_norm": 0.4644507284510041,
|
|
"learning_rate": 4.169040003119871e-06,
|
|
"loss": 0.2297,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12260288000106812,
|
|
"step": 3910,
|
|
"valid_targets_mean": 5018.1,
|
|
"valid_targets_min": 2599
|
|
},
|
|
{
|
|
"epoch": 5.690406976744186,
|
|
"grad_norm": 0.4916359177514743,
|
|
"learning_rate": 4.124846678786405e-06,
|
|
"loss": 0.2212,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1183990091085434,
|
|
"step": 3915,
|
|
"valid_targets_mean": 4028.6,
|
|
"valid_targets_min": 737
|
|
},
|
|
{
|
|
"epoch": 5.6976744186046515,
|
|
"grad_norm": 0.5389463683484641,
|
|
"learning_rate": 4.080861889662642e-06,
|
|
"loss": 0.2324,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14097467064857483,
|
|
"step": 3920,
|
|
"valid_targets_mean": 4007.8,
|
|
"valid_targets_min": 745
|
|
},
|
|
{
|
|
"epoch": 5.704941860465116,
|
|
"grad_norm": 0.5394672937113356,
|
|
"learning_rate": 4.037086213530539e-06,
|
|
"loss": 0.2401,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1080642119050026,
|
|
"step": 3925,
|
|
"valid_targets_mean": 3299.9,
|
|
"valid_targets_min": 431
|
|
},
|
|
{
|
|
"epoch": 5.712209302325581,
|
|
"grad_norm": 0.5031746817464193,
|
|
"learning_rate": 3.993520225425154e-06,
|
|
"loss": 0.235,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09760770946741104,
|
|
"step": 3930,
|
|
"valid_targets_mean": 3632.9,
|
|
"valid_targets_min": 567
|
|
},
|
|
{
|
|
"epoch": 5.719476744186046,
|
|
"grad_norm": 0.5497879839779796,
|
|
"learning_rate": 3.9501644976271095e-06,
|
|
"loss": 0.2258,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11778296530246735,
|
|
"step": 3935,
|
|
"valid_targets_mean": 4291.6,
|
|
"valid_targets_min": 572
|
|
},
|
|
{
|
|
"epoch": 5.726744186046512,
|
|
"grad_norm": 0.4776129835677131,
|
|
"learning_rate": 3.907019599655044e-06,
|
|
"loss": 0.2205,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10025591403245926,
|
|
"step": 3940,
|
|
"valid_targets_mean": 4037.6,
|
|
"valid_targets_min": 736
|
|
},
|
|
{
|
|
"epoch": 5.734011627906977,
|
|
"grad_norm": 0.5246341815995155,
|
|
"learning_rate": 3.864086098258153e-06,
|
|
"loss": 0.2239,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12622231245040894,
|
|
"step": 3945,
|
|
"valid_targets_mean": 3679.9,
|
|
"valid_targets_min": 607
|
|
},
|
|
{
|
|
"epoch": 5.741279069767442,
|
|
"grad_norm": 0.6086055176247579,
|
|
"learning_rate": 3.8213645574087286e-06,
|
|
"loss": 0.2194,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10311783850193024,
|
|
"step": 3950,
|
|
"valid_targets_mean": 2590.5,
|
|
"valid_targets_min": 633
|
|
},
|
|
{
|
|
"epoch": 5.748546511627907,
|
|
"grad_norm": 0.45195401508843,
|
|
"learning_rate": 3.778855538294779e-06,
|
|
"loss": 0.2226,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09347233176231384,
|
|
"step": 3955,
|
|
"valid_targets_mean": 4437.8,
|
|
"valid_targets_min": 607
|
|
},
|
|
{
|
|
"epoch": 5.7558139534883725,
|
|
"grad_norm": 0.6060623213653233,
|
|
"learning_rate": 3.736559599312619e-06,
|
|
"loss": 0.227,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11307326704263687,
|
|
"step": 3960,
|
|
"valid_targets_mean": 3571.6,
|
|
"valid_targets_min": 785
|
|
},
|
|
{
|
|
"epoch": 5.763081395348837,
|
|
"grad_norm": 0.5002442442836875,
|
|
"learning_rate": 3.6944772960595597e-06,
|
|
"loss": 0.2268,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1352311074733734,
|
|
"step": 3965,
|
|
"valid_targets_mean": 5457.2,
|
|
"valid_targets_min": 3562
|
|
},
|
|
{
|
|
"epoch": 5.770348837209302,
|
|
"grad_norm": 0.5754115654946838,
|
|
"learning_rate": 3.652609181326601e-06,
|
|
"loss": 0.2338,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12333385646343231,
|
|
"step": 3970,
|
|
"valid_targets_mean": 3621.1,
|
|
"valid_targets_min": 647
|
|
},
|
|
{
|
|
"epoch": 5.777616279069767,
|
|
"grad_norm": 0.5231121941154192,
|
|
"learning_rate": 3.610955805091185e-06,
|
|
"loss": 0.217,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09638865292072296,
|
|
"step": 3975,
|
|
"valid_targets_mean": 3402.5,
|
|
"valid_targets_min": 776
|
|
},
|
|
{
|
|
"epoch": 5.784883720930233,
|
|
"grad_norm": 0.5508341437323052,
|
|
"learning_rate": 3.569517714509947e-06,
|
|
"loss": 0.2204,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13687901198863983,
|
|
"step": 3980,
|
|
"valid_targets_mean": 4811.4,
|
|
"valid_targets_min": 4256
|
|
},
|
|
{
|
|
"epoch": 5.792151162790698,
|
|
"grad_norm": 0.5254922241131528,
|
|
"learning_rate": 3.528295453911541e-06,
|
|
"loss": 0.2307,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1139884814620018,
|
|
"step": 3985,
|
|
"valid_targets_mean": 3759.5,
|
|
"valid_targets_min": 676
|
|
},
|
|
{
|
|
"epoch": 5.799418604651163,
|
|
"grad_norm": 0.6129810405498609,
|
|
"learning_rate": 3.4872895647895045e-06,
|
|
"loss": 0.229,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12669987976551056,
|
|
"step": 3990,
|
|
"valid_targets_mean": 3018.9,
|
|
"valid_targets_min": 432
|
|
},
|
|
{
|
|
"epoch": 5.8066860465116275,
|
|
"grad_norm": 0.5650351578983417,
|
|
"learning_rate": 3.446500585795112e-06,
|
|
"loss": 0.2182,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1187901720404625,
|
|
"step": 3995,
|
|
"valid_targets_mean": 3951.6,
|
|
"valid_targets_min": 532
|
|
},
|
|
{
|
|
"epoch": 5.813953488372093,
|
|
"grad_norm": 0.5922160583846725,
|
|
"learning_rate": 3.4059290527303256e-06,
|
|
"loss": 0.2414,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0975690633058548,
|
|
"step": 4000,
|
|
"valid_targets_mean": 2933.4,
|
|
"valid_targets_min": 543
|
|
},
|
|
{
|
|
"epoch": 5.821220930232558,
|
|
"grad_norm": 0.5524185962304792,
|
|
"learning_rate": 3.3655754985407453e-06,
|
|
"loss": 0.2335,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.144732266664505,
|
|
"step": 4005,
|
|
"valid_targets_mean": 4334.1,
|
|
"valid_targets_min": 699
|
|
},
|
|
{
|
|
"epoch": 5.828488372093023,
|
|
"grad_norm": 0.554719491811411,
|
|
"learning_rate": 3.3254404533086216e-06,
|
|
"loss": 0.2248,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11786288022994995,
|
|
"step": 4010,
|
|
"valid_targets_mean": 3635.6,
|
|
"valid_targets_min": 883
|
|
},
|
|
{
|
|
"epoch": 5.835755813953488,
|
|
"grad_norm": 0.525008145807584,
|
|
"learning_rate": 3.285524444245873e-06,
|
|
"loss": 0.2373,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13068491220474243,
|
|
"step": 4015,
|
|
"valid_targets_mean": 4179.9,
|
|
"valid_targets_min": 887
|
|
},
|
|
{
|
|
"epoch": 5.843023255813954,
|
|
"grad_norm": 0.5177901449861642,
|
|
"learning_rate": 3.245827995687165e-06,
|
|
"loss": 0.2215,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1204511895775795,
|
|
"step": 4020,
|
|
"valid_targets_mean": 4649.1,
|
|
"valid_targets_min": 796
|
|
},
|
|
{
|
|
"epoch": 5.850290697674419,
|
|
"grad_norm": 0.5388393937448382,
|
|
"learning_rate": 3.2063516290830445e-06,
|
|
"loss": 0.2311,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13081350922584534,
|
|
"step": 4025,
|
|
"valid_targets_mean": 4260.2,
|
|
"valid_targets_min": 870
|
|
},
|
|
{
|
|
"epoch": 5.857558139534884,
|
|
"grad_norm": 0.5869572044002439,
|
|
"learning_rate": 3.1670958629930595e-06,
|
|
"loss": 0.2328,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09571430832147598,
|
|
"step": 4030,
|
|
"valid_targets_mean": 1790.9,
|
|
"valid_targets_min": 200
|
|
},
|
|
{
|
|
"epoch": 5.8648255813953485,
|
|
"grad_norm": 0.5432452195757204,
|
|
"learning_rate": 3.1280612130789633e-06,
|
|
"loss": 0.227,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.15068915486335754,
|
|
"step": 4035,
|
|
"valid_targets_mean": 4574.0,
|
|
"valid_targets_min": 629
|
|
},
|
|
{
|
|
"epoch": 5.872093023255814,
|
|
"grad_norm": 0.541853575741418,
|
|
"learning_rate": 3.0892481920979355e-06,
|
|
"loss": 0.2216,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11317667365074158,
|
|
"step": 4040,
|
|
"valid_targets_mean": 3943.2,
|
|
"valid_targets_min": 600
|
|
},
|
|
{
|
|
"epoch": 5.879360465116279,
|
|
"grad_norm": 0.5979049468845229,
|
|
"learning_rate": 3.0506573098958613e-06,
|
|
"loss": 0.2299,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10876569151878357,
|
|
"step": 4045,
|
|
"valid_targets_mean": 3525.4,
|
|
"valid_targets_min": 555
|
|
},
|
|
{
|
|
"epoch": 5.886627906976744,
|
|
"grad_norm": 0.5448360093244398,
|
|
"learning_rate": 3.0122890734006114e-06,
|
|
"loss": 0.222,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09871428459882736,
|
|
"step": 4050,
|
|
"valid_targets_mean": 3317.1,
|
|
"valid_targets_min": 615
|
|
},
|
|
{
|
|
"epoch": 5.8938953488372094,
|
|
"grad_norm": 0.5699959641756522,
|
|
"learning_rate": 2.97414398661539e-06,
|
|
"loss": 0.2246,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10872367769479752,
|
|
"step": 4055,
|
|
"valid_targets_mean": 3118.6,
|
|
"valid_targets_min": 632
|
|
},
|
|
{
|
|
"epoch": 5.901162790697675,
|
|
"grad_norm": 0.4759006211842608,
|
|
"learning_rate": 2.9362225506121357e-06,
|
|
"loss": 0.2167,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08648262172937393,
|
|
"step": 4060,
|
|
"valid_targets_mean": 3458.9,
|
|
"valid_targets_min": 591
|
|
},
|
|
{
|
|
"epoch": 5.908430232558139,
|
|
"grad_norm": 0.5187120792922781,
|
|
"learning_rate": 2.8985252635249026e-06,
|
|
"loss": 0.2189,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13931739330291748,
|
|
"step": 4065,
|
|
"valid_targets_mean": 4865.6,
|
|
"valid_targets_min": 690
|
|
},
|
|
{
|
|
"epoch": 5.915697674418604,
|
|
"grad_norm": 0.44646041509070417,
|
|
"learning_rate": 2.8610526205433476e-06,
|
|
"loss": 0.2314,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1304367482662201,
|
|
"step": 4070,
|
|
"valid_targets_mean": 5352.8,
|
|
"valid_targets_min": 4351
|
|
},
|
|
{
|
|
"epoch": 5.9229651162790695,
|
|
"grad_norm": 0.5127187092080205,
|
|
"learning_rate": 2.823805113906204e-06,
|
|
"loss": 0.218,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1429927945137024,
|
|
"step": 4075,
|
|
"valid_targets_mean": 4904.5,
|
|
"valid_targets_min": 3744
|
|
},
|
|
{
|
|
"epoch": 5.930232558139535,
|
|
"grad_norm": 0.5192855903363226,
|
|
"learning_rate": 2.7867832328948385e-06,
|
|
"loss": 0.2138,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.090521439909935,
|
|
"step": 4080,
|
|
"valid_targets_mean": 3285.5,
|
|
"valid_targets_min": 633
|
|
},
|
|
{
|
|
"epoch": 5.9375,
|
|
"grad_norm": 0.4794115204926523,
|
|
"learning_rate": 2.7499874638268044e-06,
|
|
"loss": 0.2265,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12026579678058624,
|
|
"step": 4085,
|
|
"valid_targets_mean": 5181.1,
|
|
"valid_targets_min": 3352
|
|
},
|
|
{
|
|
"epoch": 5.944767441860465,
|
|
"grad_norm": 0.5009908186316896,
|
|
"learning_rate": 2.7134182900494542e-06,
|
|
"loss": 0.2314,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09819701313972473,
|
|
"step": 4090,
|
|
"valid_targets_mean": 3623.4,
|
|
"valid_targets_min": 578
|
|
},
|
|
{
|
|
"epoch": 5.9520348837209305,
|
|
"grad_norm": 0.456827041300496,
|
|
"learning_rate": 2.6770761919336098e-06,
|
|
"loss": 0.2226,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11058850586414337,
|
|
"step": 4095,
|
|
"valid_targets_mean": 4412.2,
|
|
"valid_targets_min": 3777
|
|
},
|
|
{
|
|
"epoch": 5.959302325581396,
|
|
"grad_norm": 0.5665319932821282,
|
|
"learning_rate": 2.640961646867224e-06,
|
|
"loss": 0.2412,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0975506603717804,
|
|
"step": 4100,
|
|
"valid_targets_mean": 3505.1,
|
|
"valid_targets_min": 734
|
|
},
|
|
{
|
|
"epoch": 5.966569767441861,
|
|
"grad_norm": 0.5428484473133973,
|
|
"learning_rate": 2.605075129249135e-06,
|
|
"loss": 0.2221,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1216345876455307,
|
|
"step": 4105,
|
|
"valid_targets_mean": 4187.2,
|
|
"valid_targets_min": 608
|
|
},
|
|
{
|
|
"epoch": 5.973837209302325,
|
|
"grad_norm": 0.6032813933057201,
|
|
"learning_rate": 2.5694171104828146e-06,
|
|
"loss": 0.2253,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10044913738965988,
|
|
"step": 4110,
|
|
"valid_targets_mean": 2797.5,
|
|
"valid_targets_min": 844
|
|
},
|
|
{
|
|
"epoch": 5.9811046511627906,
|
|
"grad_norm": 0.5147925778815827,
|
|
"learning_rate": 2.533988058970198e-06,
|
|
"loss": 0.2212,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10603871941566467,
|
|
"step": 4115,
|
|
"valid_targets_mean": 3845.6,
|
|
"valid_targets_min": 584
|
|
},
|
|
{
|
|
"epoch": 5.988372093023256,
|
|
"grad_norm": 0.5327598308654197,
|
|
"learning_rate": 2.498788440105506e-06,
|
|
"loss": 0.224,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11044016480445862,
|
|
"step": 4120,
|
|
"valid_targets_mean": 4463.9,
|
|
"valid_targets_min": 807
|
|
},
|
|
{
|
|
"epoch": 5.995639534883721,
|
|
"grad_norm": 0.5854269304654619,
|
|
"learning_rate": 2.4638187162691487e-06,
|
|
"loss": 0.2239,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12129954993724823,
|
|
"step": 4125,
|
|
"valid_targets_mean": 3566.0,
|
|
"valid_targets_min": 512
|
|
},
|
|
{
|
|
"epoch": 6.002906976744186,
|
|
"grad_norm": 0.5313957720724034,
|
|
"learning_rate": 2.42907934682165e-06,
|
|
"loss": 0.2187,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1027924120426178,
|
|
"step": 4130,
|
|
"valid_targets_mean": 3559.5,
|
|
"valid_targets_min": 612
|
|
},
|
|
{
|
|
"epoch": 6.0101744186046515,
|
|
"grad_norm": 0.5483117826436876,
|
|
"learning_rate": 2.3945707880976034e-06,
|
|
"loss": 0.218,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13372516632080078,
|
|
"step": 4135,
|
|
"valid_targets_mean": 5047.0,
|
|
"valid_targets_min": 631
|
|
},
|
|
{
|
|
"epoch": 6.017441860465116,
|
|
"grad_norm": 0.5090642043437736,
|
|
"learning_rate": 2.36029349339969e-06,
|
|
"loss": 0.2308,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10333339869976044,
|
|
"step": 4140,
|
|
"valid_targets_mean": 3638.2,
|
|
"valid_targets_min": 698
|
|
},
|
|
{
|
|
"epoch": 6.024709302325581,
|
|
"grad_norm": 0.5066239118036157,
|
|
"learning_rate": 2.3262479129927116e-06,
|
|
"loss": 0.2236,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11342179775238037,
|
|
"step": 4145,
|
|
"valid_targets_mean": 4146.6,
|
|
"valid_targets_min": 657
|
|
},
|
|
{
|
|
"epoch": 6.031976744186046,
|
|
"grad_norm": 0.48087895739663883,
|
|
"learning_rate": 2.2924344940976975e-06,
|
|
"loss": 0.2211,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09436848759651184,
|
|
"step": 4150,
|
|
"valid_targets_mean": 3816.1,
|
|
"valid_targets_min": 666
|
|
},
|
|
{
|
|
"epoch": 6.039244186046512,
|
|
"grad_norm": 0.5537030876418265,
|
|
"learning_rate": 2.2588536808859975e-06,
|
|
"loss": 0.2125,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11316031217575073,
|
|
"step": 4155,
|
|
"valid_targets_mean": 4260.8,
|
|
"valid_targets_min": 727
|
|
},
|
|
{
|
|
"epoch": 6.046511627906977,
|
|
"grad_norm": 0.5833788098367146,
|
|
"learning_rate": 2.225505914473469e-06,
|
|
"loss": 0.2101,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12212025374174118,
|
|
"step": 4160,
|
|
"valid_targets_mean": 3621.4,
|
|
"valid_targets_min": 572
|
|
},
|
|
{
|
|
"epoch": 6.053779069767442,
|
|
"grad_norm": 0.7362174701066857,
|
|
"learning_rate": 2.19239163291469e-06,
|
|
"loss": 0.2182,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09100019931793213,
|
|
"step": 4165,
|
|
"valid_targets_mean": 3448.5,
|
|
"valid_targets_min": 667
|
|
},
|
|
{
|
|
"epoch": 6.061046511627907,
|
|
"grad_norm": 0.4740406178811528,
|
|
"learning_rate": 2.1595112711971835e-06,
|
|
"loss": 0.2243,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09100145101547241,
|
|
"step": 4170,
|
|
"valid_targets_mean": 4132.0,
|
|
"valid_targets_min": 722
|
|
},
|
|
{
|
|
"epoch": 6.068313953488372,
|
|
"grad_norm": 0.6161720448401335,
|
|
"learning_rate": 2.1268652612357153e-06,
|
|
"loss": 0.2347,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13534143567085266,
|
|
"step": 4175,
|
|
"valid_targets_mean": 3147.4,
|
|
"valid_targets_min": 602
|
|
},
|
|
{
|
|
"epoch": 6.075581395348837,
|
|
"grad_norm": 0.5205546045427543,
|
|
"learning_rate": 2.0944540318666107e-06,
|
|
"loss": 0.2093,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1053255945444107,
|
|
"step": 4180,
|
|
"valid_targets_mean": 3569.5,
|
|
"valid_targets_min": 524
|
|
},
|
|
{
|
|
"epoch": 6.082848837209302,
|
|
"grad_norm": 0.6116553776699947,
|
|
"learning_rate": 2.062278008842147e-06,
|
|
"loss": 0.2354,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09495720267295837,
|
|
"step": 4185,
|
|
"valid_targets_mean": 2838.4,
|
|
"valid_targets_min": 591
|
|
},
|
|
{
|
|
"epoch": 6.090116279069767,
|
|
"grad_norm": 0.5276279180760463,
|
|
"learning_rate": 2.030337614824929e-06,
|
|
"loss": 0.2242,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11515341699123383,
|
|
"step": 4190,
|
|
"valid_targets_mean": 3900.5,
|
|
"valid_targets_min": 548
|
|
},
|
|
{
|
|
"epoch": 6.097383720930233,
|
|
"grad_norm": 0.5208050337446745,
|
|
"learning_rate": 1.9986332693823487e-06,
|
|
"loss": 0.2206,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.07439148426055908,
|
|
"step": 4195,
|
|
"valid_targets_mean": 2552.5,
|
|
"valid_targets_min": 582
|
|
},
|
|
{
|
|
"epoch": 6.104651162790698,
|
|
"grad_norm": 0.5694598831791498,
|
|
"learning_rate": 1.9671653889810893e-06,
|
|
"loss": 0.2212,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09752744436264038,
|
|
"step": 4200,
|
|
"valid_targets_mean": 3513.8,
|
|
"valid_targets_min": 583
|
|
},
|
|
{
|
|
"epoch": 6.111918604651163,
|
|
"grad_norm": 0.49122429844668036,
|
|
"learning_rate": 1.9359343869816307e-06,
|
|
"loss": 0.2173,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10171881318092346,
|
|
"step": 4205,
|
|
"valid_targets_mean": 3564.2,
|
|
"valid_targets_min": 707
|
|
},
|
|
{
|
|
"epoch": 6.119186046511628,
|
|
"grad_norm": 0.5429562792251613,
|
|
"learning_rate": 1.9049406736328336e-06,
|
|
"loss": 0.2119,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1320454478263855,
|
|
"step": 4210,
|
|
"valid_targets_mean": 3916.1,
|
|
"valid_targets_min": 882
|
|
},
|
|
{
|
|
"epoch": 6.126453488372093,
|
|
"grad_norm": 0.5930470816888453,
|
|
"learning_rate": 1.87418465606654e-06,
|
|
"loss": 0.2188,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.115715891122818,
|
|
"step": 4215,
|
|
"valid_targets_mean": 3784.2,
|
|
"valid_targets_min": 652
|
|
},
|
|
{
|
|
"epoch": 6.133720930232558,
|
|
"grad_norm": 0.4980643141344037,
|
|
"learning_rate": 1.8436667382922468e-06,
|
|
"loss": 0.2197,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11309342831373215,
|
|
"step": 4220,
|
|
"valid_targets_mean": 4678.9,
|
|
"valid_targets_min": 1008
|
|
},
|
|
{
|
|
"epoch": 6.140988372093023,
|
|
"grad_norm": 0.5369540725587354,
|
|
"learning_rate": 1.8133873211917686e-06,
|
|
"loss": 0.2214,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11754552274942398,
|
|
"step": 4225,
|
|
"valid_targets_mean": 4220.1,
|
|
"valid_targets_min": 1120
|
|
},
|
|
{
|
|
"epoch": 6.148255813953488,
|
|
"grad_norm": 0.5125697181326947,
|
|
"learning_rate": 1.783346802514001e-06,
|
|
"loss": 0.2334,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10513949394226074,
|
|
"step": 4230,
|
|
"valid_targets_mean": 3621.4,
|
|
"valid_targets_min": 642
|
|
},
|
|
{
|
|
"epoch": 6.155523255813954,
|
|
"grad_norm": 0.5837456425846023,
|
|
"learning_rate": 1.7535455768696686e-06,
|
|
"loss": 0.2243,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1067032665014267,
|
|
"step": 4235,
|
|
"valid_targets_mean": 3622.5,
|
|
"valid_targets_min": 537
|
|
},
|
|
{
|
|
"epoch": 6.162790697674419,
|
|
"grad_norm": 0.6370646912449455,
|
|
"learning_rate": 1.7239840357261695e-06,
|
|
"loss": 0.2234,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10105766355991364,
|
|
"step": 4240,
|
|
"valid_targets_mean": 2271.6,
|
|
"valid_targets_min": 684
|
|
},
|
|
{
|
|
"epoch": 6.170058139534884,
|
|
"grad_norm": 0.6028206483589204,
|
|
"learning_rate": 1.6946625674024053e-06,
|
|
"loss": 0.2216,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12402664870023727,
|
|
"step": 4245,
|
|
"valid_targets_mean": 3750.8,
|
|
"valid_targets_min": 635
|
|
},
|
|
{
|
|
"epoch": 6.1773255813953485,
|
|
"grad_norm": 0.48050804435313044,
|
|
"learning_rate": 1.6655815570637002e-06,
|
|
"loss": 0.2249,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13276661932468414,
|
|
"step": 4250,
|
|
"valid_targets_mean": 5509.6,
|
|
"valid_targets_min": 3861
|
|
},
|
|
{
|
|
"epoch": 6.184593023255814,
|
|
"grad_norm": 0.5069577336702119,
|
|
"learning_rate": 1.636741386716727e-06,
|
|
"loss": 0.2216,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10672836005687714,
|
|
"step": 4255,
|
|
"valid_targets_mean": 3849.8,
|
|
"valid_targets_min": 559
|
|
},
|
|
{
|
|
"epoch": 6.191860465116279,
|
|
"grad_norm": 0.5080026242663115,
|
|
"learning_rate": 1.6081424352045093e-06,
|
|
"loss": 0.2165,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09645294398069382,
|
|
"step": 4260,
|
|
"valid_targets_mean": 4101.6,
|
|
"valid_targets_min": 737
|
|
},
|
|
{
|
|
"epoch": 6.199127906976744,
|
|
"grad_norm": 0.5273845094067898,
|
|
"learning_rate": 1.5797850782014236e-06,
|
|
"loss": 0.2177,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1336199790239334,
|
|
"step": 4265,
|
|
"valid_targets_mean": 4568.8,
|
|
"valid_targets_min": 596
|
|
},
|
|
{
|
|
"epoch": 6.2063953488372094,
|
|
"grad_norm": 0.4797757782978097,
|
|
"learning_rate": 1.5516696882082704e-06,
|
|
"loss": 0.2202,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08058105409145355,
|
|
"step": 4270,
|
|
"valid_targets_mean": 3192.5,
|
|
"valid_targets_min": 662
|
|
},
|
|
{
|
|
"epoch": 6.213662790697675,
|
|
"grad_norm": 0.5417432832678817,
|
|
"learning_rate": 1.5237966345473942e-06,
|
|
"loss": 0.2238,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09182320535182953,
|
|
"step": 4275,
|
|
"valid_targets_mean": 3194.9,
|
|
"valid_targets_min": 803
|
|
},
|
|
{
|
|
"epoch": 6.22093023255814,
|
|
"grad_norm": 0.554513792637474,
|
|
"learning_rate": 1.4961662833578117e-06,
|
|
"loss": 0.2218,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11547038704156876,
|
|
"step": 4280,
|
|
"valid_targets_mean": 3828.1,
|
|
"valid_targets_min": 391
|
|
},
|
|
{
|
|
"epoch": 6.228197674418604,
|
|
"grad_norm": 0.5063980695402167,
|
|
"learning_rate": 1.4687789975904188e-06,
|
|
"loss": 0.2269,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10384702682495117,
|
|
"step": 4285,
|
|
"valid_targets_mean": 4186.2,
|
|
"valid_targets_min": 771
|
|
},
|
|
{
|
|
"epoch": 6.2354651162790695,
|
|
"grad_norm": 0.5851372180371623,
|
|
"learning_rate": 1.4416351370032077e-06,
|
|
"loss": 0.2202,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12599419057369232,
|
|
"step": 4290,
|
|
"valid_targets_mean": 4214.8,
|
|
"valid_targets_min": 701
|
|
},
|
|
{
|
|
"epoch": 6.242732558139535,
|
|
"grad_norm": 0.49149694835880525,
|
|
"learning_rate": 1.4147350581565644e-06,
|
|
"loss": 0.2265,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09488339722156525,
|
|
"step": 4295,
|
|
"valid_targets_mean": 4413.6,
|
|
"valid_targets_min": 3553
|
|
},
|
|
{
|
|
"epoch": 6.25,
|
|
"grad_norm": 0.5118955700863174,
|
|
"learning_rate": 1.3880791144085582e-06,
|
|
"loss": 0.2201,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10951229184865952,
|
|
"step": 4300,
|
|
"valid_targets_mean": 4576.1,
|
|
"valid_targets_min": 731
|
|
},
|
|
{
|
|
"epoch": 6.257267441860465,
|
|
"grad_norm": 0.5463767287892208,
|
|
"learning_rate": 1.3616676559103104e-06,
|
|
"loss": 0.2205,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10446491092443466,
|
|
"step": 4305,
|
|
"valid_targets_mean": 3518.8,
|
|
"valid_targets_min": 438
|
|
},
|
|
{
|
|
"epoch": 6.2645348837209305,
|
|
"grad_norm": 0.49764498999090684,
|
|
"learning_rate": 1.3355010296014114e-06,
|
|
"loss": 0.2214,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08116332441568375,
|
|
"step": 4310,
|
|
"valid_targets_mean": 2714.1,
|
|
"valid_targets_min": 623
|
|
},
|
|
{
|
|
"epoch": 6.271802325581396,
|
|
"grad_norm": 0.5963734494507665,
|
|
"learning_rate": 1.3095795792053333e-06,
|
|
"loss": 0.2213,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11170788109302521,
|
|
"step": 4315,
|
|
"valid_targets_mean": 2810.2,
|
|
"valid_targets_min": 533
|
|
},
|
|
{
|
|
"epoch": 6.27906976744186,
|
|
"grad_norm": 0.5953286940405174,
|
|
"learning_rate": 1.2839036452249354e-06,
|
|
"loss": 0.2246,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10700145363807678,
|
|
"step": 4320,
|
|
"valid_targets_mean": 2889.1,
|
|
"valid_targets_min": 519
|
|
},
|
|
{
|
|
"epoch": 6.286337209302325,
|
|
"grad_norm": 0.50442415172854,
|
|
"learning_rate": 1.258473564937981e-06,
|
|
"loss": 0.2174,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09842683374881744,
|
|
"step": 4325,
|
|
"valid_targets_mean": 3742.9,
|
|
"valid_targets_min": 498
|
|
},
|
|
{
|
|
"epoch": 6.2936046511627906,
|
|
"grad_norm": 0.5110182940973045,
|
|
"learning_rate": 1.2332896723927257e-06,
|
|
"loss": 0.2206,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1370856612920761,
|
|
"step": 4330,
|
|
"valid_targets_mean": 4617.8,
|
|
"valid_targets_min": 603
|
|
},
|
|
{
|
|
"epoch": 6.300872093023256,
|
|
"grad_norm": 0.5524502877034365,
|
|
"learning_rate": 1.2083522984035012e-06,
|
|
"loss": 0.2214,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10689415782690048,
|
|
"step": 4335,
|
|
"valid_targets_mean": 4125.2,
|
|
"valid_targets_min": 687
|
|
},
|
|
{
|
|
"epoch": 6.308139534883721,
|
|
"grad_norm": 0.5041840537184159,
|
|
"learning_rate": 1.183661770546387e-06,
|
|
"loss": 0.2205,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1000676080584526,
|
|
"step": 4340,
|
|
"valid_targets_mean": 4452.4,
|
|
"valid_targets_min": 634
|
|
},
|
|
{
|
|
"epoch": 6.315406976744186,
|
|
"grad_norm": 0.5507381719553612,
|
|
"learning_rate": 1.1592184131549056e-06,
|
|
"loss": 0.2246,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10032293200492859,
|
|
"step": 4345,
|
|
"valid_targets_mean": 3549.0,
|
|
"valid_targets_min": 799
|
|
},
|
|
{
|
|
"epoch": 6.3226744186046515,
|
|
"grad_norm": 0.6529547645313896,
|
|
"learning_rate": 1.1350225473157672e-06,
|
|
"loss": 0.2159,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11068548262119293,
|
|
"step": 4350,
|
|
"valid_targets_mean": 2916.9,
|
|
"valid_targets_min": 594
|
|
},
|
|
{
|
|
"epoch": 6.329941860465116,
|
|
"grad_norm": 0.5210812553212651,
|
|
"learning_rate": 1.1110744908646365e-06,
|
|
"loss": 0.2126,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0965781882405281,
|
|
"step": 4355,
|
|
"valid_targets_mean": 3368.5,
|
|
"valid_targets_min": 430
|
|
},
|
|
{
|
|
"epoch": 6.337209302325581,
|
|
"grad_norm": 0.5332519718749112,
|
|
"learning_rate": 1.0873745583819661e-06,
|
|
"loss": 0.2242,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1284990906715393,
|
|
"step": 4360,
|
|
"valid_targets_mean": 4401.9,
|
|
"valid_targets_min": 506
|
|
},
|
|
{
|
|
"epoch": 6.344476744186046,
|
|
"grad_norm": 0.591577869670093,
|
|
"learning_rate": 1.063923061188874e-06,
|
|
"loss": 0.2175,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09908381849527359,
|
|
"step": 4365,
|
|
"valid_targets_mean": 3131.2,
|
|
"valid_targets_min": 692
|
|
},
|
|
{
|
|
"epoch": 6.351744186046512,
|
|
"grad_norm": 0.491072911458214,
|
|
"learning_rate": 1.040720307343035e-06,
|
|
"loss": 0.2226,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11375901103019714,
|
|
"step": 4370,
|
|
"valid_targets_mean": 3776.2,
|
|
"valid_targets_min": 611
|
|
},
|
|
{
|
|
"epoch": 6.359011627906977,
|
|
"grad_norm": 0.4770207504307759,
|
|
"learning_rate": 1.017766601634651e-06,
|
|
"loss": 0.2207,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10760487616062164,
|
|
"step": 4375,
|
|
"valid_targets_mean": 4155.9,
|
|
"valid_targets_min": 955
|
|
},
|
|
{
|
|
"epoch": 6.366279069767442,
|
|
"grad_norm": 0.5874644357170348,
|
|
"learning_rate": 9.95062245582432e-07,
|
|
"loss": 0.218,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11503146588802338,
|
|
"step": 4380,
|
|
"valid_targets_mean": 3213.0,
|
|
"valid_targets_min": 708
|
|
},
|
|
{
|
|
"epoch": 6.373546511627907,
|
|
"grad_norm": 0.5843827386614309,
|
|
"learning_rate": 9.72607537429655e-07,
|
|
"loss": 0.2113,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08797569572925568,
|
|
"step": 4385,
|
|
"valid_targets_mean": 2145.5,
|
|
"valid_targets_min": 603
|
|
},
|
|
{
|
|
"epoch": 6.3808139534883725,
|
|
"grad_norm": 0.5332039227041807,
|
|
"learning_rate": 9.504027721402264e-07,
|
|
"loss": 0.2222,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10198168456554413,
|
|
"step": 4390,
|
|
"valid_targets_mean": 3549.4,
|
|
"valid_targets_min": 646
|
|
},
|
|
{
|
|
"epoch": 6.388081395348837,
|
|
"grad_norm": 0.5561080394886057,
|
|
"learning_rate": 9.284482413948148e-07,
|
|
"loss": 0.2213,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09928165376186371,
|
|
"step": 4395,
|
|
"valid_targets_mean": 3426.6,
|
|
"valid_targets_min": 498
|
|
},
|
|
{
|
|
"epoch": 6.395348837209302,
|
|
"grad_norm": 0.5387550513714358,
|
|
"learning_rate": 9.067442335870313e-07,
|
|
"loss": 0.2175,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11906737089157104,
|
|
"step": 4400,
|
|
"valid_targets_mean": 4181.0,
|
|
"valid_targets_min": 700
|
|
},
|
|
{
|
|
"epoch": 6.402616279069767,
|
|
"grad_norm": 0.5325231325865825,
|
|
"learning_rate": 8.852910338196152e-07,
|
|
"loss": 0.2141,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11549727618694305,
|
|
"step": 4405,
|
|
"valid_targets_mean": 3811.0,
|
|
"valid_targets_min": 755
|
|
},
|
|
{
|
|
"epoch": 6.409883720930233,
|
|
"grad_norm": 0.6373446805590439,
|
|
"learning_rate": 8.640889239007166e-07,
|
|
"loss": 0.222,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14769718050956726,
|
|
"step": 4410,
|
|
"valid_targets_mean": 4159.0,
|
|
"valid_targets_min": 647
|
|
},
|
|
{
|
|
"epoch": 6.417151162790698,
|
|
"grad_norm": 0.5824414070647802,
|
|
"learning_rate": 8.431381823401708e-07,
|
|
"loss": 0.2209,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12444661557674408,
|
|
"step": 4415,
|
|
"valid_targets_mean": 4532.4,
|
|
"valid_targets_min": 709
|
|
},
|
|
{
|
|
"epoch": 6.424418604651163,
|
|
"grad_norm": 0.5213493346535095,
|
|
"learning_rate": 8.224390843458652e-07,
|
|
"loss": 0.2207,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08908454328775406,
|
|
"step": 4420,
|
|
"valid_targets_mean": 3492.6,
|
|
"valid_targets_min": 784
|
|
},
|
|
{
|
|
"epoch": 6.4316860465116275,
|
|
"grad_norm": 0.5660283158101067,
|
|
"learning_rate": 8.019919018201005e-07,
|
|
"loss": 0.22,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.07104974240064621,
|
|
"step": 4425,
|
|
"valid_targets_mean": 2456.0,
|
|
"valid_targets_min": 417
|
|
},
|
|
{
|
|
"epoch": 6.438953488372093,
|
|
"grad_norm": 0.5321869433718921,
|
|
"learning_rate": 7.817969033560246e-07,
|
|
"loss": 0.2226,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11819642782211304,
|
|
"step": 4430,
|
|
"valid_targets_mean": 4258.0,
|
|
"valid_targets_min": 446
|
|
},
|
|
{
|
|
"epoch": 6.446220930232558,
|
|
"grad_norm": 0.4867961180366948,
|
|
"learning_rate": 7.618543542341217e-07,
|
|
"loss": 0.2168,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0961524099111557,
|
|
"step": 4435,
|
|
"valid_targets_mean": 3816.1,
|
|
"valid_targets_min": 599
|
|
},
|
|
{
|
|
"epoch": 6.453488372093023,
|
|
"grad_norm": 0.5508115967507313,
|
|
"learning_rate": 7.421645164187019e-07,
|
|
"loss": 0.2207,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.07896394282579422,
|
|
"step": 4440,
|
|
"valid_targets_mean": 2026.9,
|
|
"valid_targets_min": 671
|
|
},
|
|
{
|
|
"epoch": 6.460755813953488,
|
|
"grad_norm": 0.5667325021853805,
|
|
"learning_rate": 7.227276485544798e-07,
|
|
"loss": 0.2136,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12289373576641083,
|
|
"step": 4445,
|
|
"valid_targets_mean": 3741.6,
|
|
"valid_targets_min": 617
|
|
},
|
|
{
|
|
"epoch": 6.468023255813954,
|
|
"grad_norm": 0.5400905479292796,
|
|
"learning_rate": 7.035440059631616e-07,
|
|
"loss": 0.2087,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0943833738565445,
|
|
"step": 4450,
|
|
"valid_targets_mean": 3401.0,
|
|
"valid_targets_min": 485
|
|
},
|
|
{
|
|
"epoch": 6.475290697674419,
|
|
"grad_norm": 0.5008963346942175,
|
|
"learning_rate": 6.846138406401137e-07,
|
|
"loss": 0.224,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09646037220954895,
|
|
"step": 4455,
|
|
"valid_targets_mean": 3926.9,
|
|
"valid_targets_min": 679
|
|
},
|
|
{
|
|
"epoch": 6.482558139534884,
|
|
"grad_norm": 0.6244635618997402,
|
|
"learning_rate": 6.6593740125102e-07,
|
|
"loss": 0.2215,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12762530148029327,
|
|
"step": 4460,
|
|
"valid_targets_mean": 3475.9,
|
|
"valid_targets_min": 561
|
|
},
|
|
{
|
|
"epoch": 6.4898255813953485,
|
|
"grad_norm": 0.6847427969655168,
|
|
"learning_rate": 6.475149331286457e-07,
|
|
"loss": 0.2219,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10304777324199677,
|
|
"step": 4465,
|
|
"valid_targets_mean": 2130.4,
|
|
"valid_targets_min": 689
|
|
},
|
|
{
|
|
"epoch": 6.497093023255814,
|
|
"grad_norm": 0.4907430697763535,
|
|
"learning_rate": 6.293466782696001e-07,
|
|
"loss": 0.2244,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09903063625097275,
|
|
"step": 4470,
|
|
"valid_targets_mean": 4228.6,
|
|
"valid_targets_min": 858
|
|
},
|
|
{
|
|
"epoch": 6.504360465116279,
|
|
"grad_norm": 0.4878310457069805,
|
|
"learning_rate": 6.114328753311572e-07,
|
|
"loss": 0.2307,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08721013367176056,
|
|
"step": 4475,
|
|
"valid_targets_mean": 3588.0,
|
|
"valid_targets_min": 589
|
|
},
|
|
{
|
|
"epoch": 6.511627906976744,
|
|
"grad_norm": 0.6392602373957003,
|
|
"learning_rate": 5.937737596281223e-07,
|
|
"loss": 0.2319,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1122431606054306,
|
|
"step": 4480,
|
|
"valid_targets_mean": 2587.9,
|
|
"valid_targets_min": 468
|
|
},
|
|
{
|
|
"epoch": 6.5188953488372094,
|
|
"grad_norm": 0.6956929712450983,
|
|
"learning_rate": 5.763695631297483e-07,
|
|
"loss": 0.2294,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1025511771440506,
|
|
"step": 4485,
|
|
"valid_targets_mean": 2927.0,
|
|
"valid_targets_min": 710
|
|
},
|
|
{
|
|
"epoch": 6.526162790697675,
|
|
"grad_norm": 0.5589149132557204,
|
|
"learning_rate": 5.592205144566753e-07,
|
|
"loss": 0.2073,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11511734127998352,
|
|
"step": 4490,
|
|
"valid_targets_mean": 4215.8,
|
|
"valid_targets_min": 260
|
|
},
|
|
{
|
|
"epoch": 6.533430232558139,
|
|
"grad_norm": 0.5601364320314534,
|
|
"learning_rate": 5.423268388779424e-07,
|
|
"loss": 0.2227,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10099512338638306,
|
|
"step": 4495,
|
|
"valid_targets_mean": 3608.0,
|
|
"valid_targets_min": 665
|
|
},
|
|
{
|
|
"epoch": 6.540697674418604,
|
|
"grad_norm": 0.4749372904201485,
|
|
"learning_rate": 5.256887583080094e-07,
|
|
"loss": 0.2109,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10849292576313019,
|
|
"step": 4500,
|
|
"valid_targets_mean": 4887.2,
|
|
"valid_targets_min": 4227
|
|
},
|
|
{
|
|
"epoch": 6.5479651162790695,
|
|
"grad_norm": 0.517398445885059,
|
|
"learning_rate": 5.093064913038648e-07,
|
|
"loss": 0.2118,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.0925350934267044,
|
|
"step": 4505,
|
|
"valid_targets_mean": 3727.9,
|
|
"valid_targets_min": 693
|
|
},
|
|
{
|
|
"epoch": 6.555232558139535,
|
|
"grad_norm": 0.4669579345900138,
|
|
"learning_rate": 4.931802530621376e-07,
|
|
"loss": 0.2096,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10471238940954208,
|
|
"step": 4510,
|
|
"valid_targets_mean": 4466.2,
|
|
"valid_targets_min": 721
|
|
},
|
|
{
|
|
"epoch": 6.5625,
|
|
"grad_norm": 0.5158823636602122,
|
|
"learning_rate": 4.773102554162768e-07,
|
|
"loss": 0.2288,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09145092964172363,
|
|
"step": 4515,
|
|
"valid_targets_mean": 3328.9,
|
|
"valid_targets_min": 439
|
|
},
|
|
{
|
|
"epoch": 6.569767441860465,
|
|
"grad_norm": 0.6807986618835836,
|
|
"learning_rate": 4.61696706833763e-07,
|
|
"loss": 0.215,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12569642066955566,
|
|
"step": 4520,
|
|
"valid_targets_mean": 3699.1,
|
|
"valid_targets_min": 623
|
|
},
|
|
{
|
|
"epoch": 6.5770348837209305,
|
|
"grad_norm": 0.5600951397322557,
|
|
"learning_rate": 4.4633981241338333e-07,
|
|
"loss": 0.2195,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13266706466674805,
|
|
"step": 4525,
|
|
"valid_targets_mean": 4428.1,
|
|
"valid_targets_min": 238
|
|
},
|
|
{
|
|
"epoch": 6.584302325581396,
|
|
"grad_norm": 0.5827853749348123,
|
|
"learning_rate": 4.312397738825236e-07,
|
|
"loss": 0.2258,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12651139497756958,
|
|
"step": 4530,
|
|
"valid_targets_mean": 3696.9,
|
|
"valid_targets_min": 587
|
|
},
|
|
{
|
|
"epoch": 6.591569767441861,
|
|
"grad_norm": 0.5438654554473624,
|
|
"learning_rate": 4.163967895945242e-07,
|
|
"loss": 0.2183,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12943975627422333,
|
|
"step": 4535,
|
|
"valid_targets_mean": 4721.0,
|
|
"valid_targets_min": 857
|
|
},
|
|
{
|
|
"epoch": 6.598837209302325,
|
|
"grad_norm": 0.4830117424828023,
|
|
"learning_rate": 4.0181105452607563e-07,
|
|
"loss": 0.2142,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11082278192043304,
|
|
"step": 4540,
|
|
"valid_targets_mean": 4415.0,
|
|
"valid_targets_min": 3320
|
|
},
|
|
{
|
|
"epoch": 6.6061046511627906,
|
|
"grad_norm": 0.5336132946381207,
|
|
"learning_rate": 3.874827602746556e-07,
|
|
"loss": 0.2184,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12187427282333374,
|
|
"step": 4545,
|
|
"valid_targets_mean": 4065.5,
|
|
"valid_targets_min": 577
|
|
},
|
|
{
|
|
"epoch": 6.613372093023256,
|
|
"grad_norm": 0.5781379453512802,
|
|
"learning_rate": 3.734120950560116e-07,
|
|
"loss": 0.2242,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1307642161846161,
|
|
"step": 4550,
|
|
"valid_targets_mean": 3438.9,
|
|
"valid_targets_min": 337
|
|
},
|
|
{
|
|
"epoch": 6.620639534883721,
|
|
"grad_norm": 0.5505669899387781,
|
|
"learning_rate": 3.5959924370168487e-07,
|
|
"loss": 0.2143,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08358632028102875,
|
|
"step": 4555,
|
|
"valid_targets_mean": 3144.0,
|
|
"valid_targets_min": 596
|
|
},
|
|
{
|
|
"epoch": 6.627906976744186,
|
|
"grad_norm": 0.5629291249358289,
|
|
"learning_rate": 3.4604438765659445e-07,
|
|
"loss": 0.2226,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09669582545757294,
|
|
"step": 4560,
|
|
"valid_targets_mean": 2941.8,
|
|
"valid_targets_min": 529
|
|
},
|
|
{
|
|
"epoch": 6.6351744186046515,
|
|
"grad_norm": 0.5841625684995547,
|
|
"learning_rate": 3.3274770497664365e-07,
|
|
"loss": 0.2208,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13941574096679688,
|
|
"step": 4565,
|
|
"valid_targets_mean": 4221.9,
|
|
"valid_targets_min": 869
|
|
},
|
|
{
|
|
"epoch": 6.642441860465116,
|
|
"grad_norm": 0.5442309971971446,
|
|
"learning_rate": 3.1970937032638206e-07,
|
|
"loss": 0.2171,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08730822801589966,
|
|
"step": 4570,
|
|
"valid_targets_mean": 3145.8,
|
|
"valid_targets_min": 541
|
|
},
|
|
{
|
|
"epoch": 6.649709302325581,
|
|
"grad_norm": 0.6272064657031894,
|
|
"learning_rate": 3.0692955497670705e-07,
|
|
"loss": 0.2187,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10662917047739029,
|
|
"step": 4575,
|
|
"valid_targets_mean": 3310.1,
|
|
"valid_targets_min": 756
|
|
},
|
|
{
|
|
"epoch": 6.656976744186046,
|
|
"grad_norm": 0.5451476495831158,
|
|
"learning_rate": 2.944084268026326e-07,
|
|
"loss": 0.2285,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10781296342611313,
|
|
"step": 4580,
|
|
"valid_targets_mean": 2932.6,
|
|
"valid_targets_min": 589
|
|
},
|
|
{
|
|
"epoch": 6.664244186046512,
|
|
"grad_norm": 0.4471826485431661,
|
|
"learning_rate": 2.821461502810641e-07,
|
|
"loss": 0.2193,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12207210063934326,
|
|
"step": 4585,
|
|
"valid_targets_mean": 4912.2,
|
|
"valid_targets_min": 4070
|
|
},
|
|
{
|
|
"epoch": 6.671511627906977,
|
|
"grad_norm": 0.5301911172654994,
|
|
"learning_rate": 2.701428864886402e-07,
|
|
"loss": 0.211,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1026616096496582,
|
|
"step": 4590,
|
|
"valid_targets_mean": 3659.4,
|
|
"valid_targets_min": 751
|
|
},
|
|
{
|
|
"epoch": 6.678779069767442,
|
|
"grad_norm": 0.7337321372097355,
|
|
"learning_rate": 2.583987930996279e-07,
|
|
"loss": 0.2204,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10018828511238098,
|
|
"step": 4595,
|
|
"valid_targets_mean": 4107.9,
|
|
"valid_targets_min": 1046
|
|
},
|
|
{
|
|
"epoch": 6.686046511627907,
|
|
"grad_norm": 0.6997967805226685,
|
|
"learning_rate": 2.469140243838464e-07,
|
|
"loss": 0.2308,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11243093013763428,
|
|
"step": 4600,
|
|
"valid_targets_mean": 2284.9,
|
|
"valid_targets_min": 521
|
|
},
|
|
{
|
|
"epoch": 6.6933139534883725,
|
|
"grad_norm": 0.5247933139316745,
|
|
"learning_rate": 2.3568873120462854e-07,
|
|
"loss": 0.2237,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09087327122688293,
|
|
"step": 4605,
|
|
"valid_targets_mean": 3116.1,
|
|
"valid_targets_min": 581
|
|
},
|
|
{
|
|
"epoch": 6.700581395348837,
|
|
"grad_norm": 0.5013207071106418,
|
|
"learning_rate": 2.247230610168627e-07,
|
|
"loss": 0.2172,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12086968123912811,
|
|
"step": 4610,
|
|
"valid_targets_mean": 4454.2,
|
|
"valid_targets_min": 3719
|
|
},
|
|
{
|
|
"epoch": 6.707848837209302,
|
|
"grad_norm": 0.49047249454640285,
|
|
"learning_rate": 2.1401715786503408e-07,
|
|
"loss": 0.2064,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10399701446294785,
|
|
"step": 4615,
|
|
"valid_targets_mean": 4197.2,
|
|
"valid_targets_min": 968
|
|
},
|
|
{
|
|
"epoch": 6.715116279069767,
|
|
"grad_norm": 0.5270903466326124,
|
|
"learning_rate": 2.0357116238134633e-07,
|
|
"loss": 0.2172,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09298289567232132,
|
|
"step": 4620,
|
|
"valid_targets_mean": 3860.4,
|
|
"valid_targets_min": 599
|
|
},
|
|
{
|
|
"epoch": 6.722383720930233,
|
|
"grad_norm": 0.5686367907075806,
|
|
"learning_rate": 1.9338521178386304e-07,
|
|
"loss": 0.2203,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13162291049957275,
|
|
"step": 4625,
|
|
"valid_targets_mean": 4046.5,
|
|
"valid_targets_min": 673
|
|
},
|
|
{
|
|
"epoch": 6.729651162790698,
|
|
"grad_norm": 0.5106997928463469,
|
|
"learning_rate": 1.8345943987471804e-07,
|
|
"loss": 0.2162,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.121708944439888,
|
|
"step": 4630,
|
|
"valid_targets_mean": 4563.0,
|
|
"valid_targets_min": 3324
|
|
},
|
|
{
|
|
"epoch": 6.736918604651163,
|
|
"grad_norm": 0.5831411162492427,
|
|
"learning_rate": 1.7379397703834788e-07,
|
|
"loss": 0.2122,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11596697568893433,
|
|
"step": 4635,
|
|
"valid_targets_mean": 3143.0,
|
|
"valid_targets_min": 696
|
|
},
|
|
{
|
|
"epoch": 6.7441860465116275,
|
|
"grad_norm": 0.5961973276477247,
|
|
"learning_rate": 1.643889502397844e-07,
|
|
"loss": 0.2259,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.129440039396286,
|
|
"step": 4640,
|
|
"valid_targets_mean": 2991.0,
|
|
"valid_targets_min": 630
|
|
},
|
|
{
|
|
"epoch": 6.751453488372093,
|
|
"grad_norm": 0.5907922312322912,
|
|
"learning_rate": 1.5524448302297822e-07,
|
|
"loss": 0.2249,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13513025641441345,
|
|
"step": 4645,
|
|
"valid_targets_mean": 4267.2,
|
|
"valid_targets_min": 834
|
|
},
|
|
{
|
|
"epoch": 6.758720930232558,
|
|
"grad_norm": 0.5781430139225441,
|
|
"learning_rate": 1.4636069550919118e-07,
|
|
"loss": 0.2201,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13518787920475006,
|
|
"step": 4650,
|
|
"valid_targets_mean": 4008.6,
|
|
"valid_targets_min": 633
|
|
},
|
|
{
|
|
"epoch": 6.765988372093023,
|
|
"grad_norm": 0.6234589323531933,
|
|
"learning_rate": 1.3773770439540646e-07,
|
|
"loss": 0.2267,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12242134660482407,
|
|
"step": 4655,
|
|
"valid_targets_mean": 3451.1,
|
|
"valid_targets_min": 562
|
|
},
|
|
{
|
|
"epoch": 6.773255813953488,
|
|
"grad_norm": 0.5007798140831097,
|
|
"learning_rate": 1.2937562295279648e-07,
|
|
"loss": 0.2163,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09039414674043655,
|
|
"step": 4660,
|
|
"valid_targets_mean": 3912.1,
|
|
"valid_targets_min": 882
|
|
},
|
|
{
|
|
"epoch": 6.780523255813954,
|
|
"grad_norm": 0.5885595688241299,
|
|
"learning_rate": 1.2127456102523748e-07,
|
|
"loss": 0.2263,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10255330055952072,
|
|
"step": 4665,
|
|
"valid_targets_mean": 2942.2,
|
|
"valid_targets_min": 464
|
|
},
|
|
{
|
|
"epoch": 6.787790697674419,
|
|
"grad_norm": 0.562684289446446,
|
|
"learning_rate": 1.1343462502787506e-07,
|
|
"loss": 0.2252,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13460709154605865,
|
|
"step": 4670,
|
|
"valid_targets_mean": 3817.2,
|
|
"valid_targets_min": 600
|
|
},
|
|
{
|
|
"epoch": 6.795058139534884,
|
|
"grad_norm": 0.6026537059681291,
|
|
"learning_rate": 1.0585591794570527e-07,
|
|
"loss": 0.2193,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1313938945531845,
|
|
"step": 4675,
|
|
"valid_targets_mean": 3602.8,
|
|
"valid_targets_min": 763
|
|
},
|
|
{
|
|
"epoch": 6.8023255813953485,
|
|
"grad_norm": 0.5853621048092735,
|
|
"learning_rate": 9.853853933224244e-08,
|
|
"loss": 0.2213,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10932928323745728,
|
|
"step": 4680,
|
|
"valid_targets_mean": 3041.2,
|
|
"valid_targets_min": 698
|
|
},
|
|
{
|
|
"epoch": 6.809593023255814,
|
|
"grad_norm": 0.6080383955492051,
|
|
"learning_rate": 9.14825853082002e-08,
|
|
"loss": 0.2186,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11644819378852844,
|
|
"step": 4685,
|
|
"valid_targets_mean": 3385.8,
|
|
"valid_targets_min": 605
|
|
},
|
|
{
|
|
"epoch": 6.816860465116279,
|
|
"grad_norm": 0.4775678543427417,
|
|
"learning_rate": 8.468814856023466e-08,
|
|
"loss": 0.2116,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1143902912735939,
|
|
"step": 4690,
|
|
"valid_targets_mean": 5123.6,
|
|
"valid_targets_min": 3314
|
|
},
|
|
{
|
|
"epoch": 6.824127906976744,
|
|
"grad_norm": 0.528062844579276,
|
|
"learning_rate": 7.815531833972323e-08,
|
|
"loss": 0.2293,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10117469727993011,
|
|
"step": 4695,
|
|
"valid_targets_mean": 3858.6,
|
|
"valid_targets_min": 412
|
|
},
|
|
{
|
|
"epoch": 6.8313953488372094,
|
|
"grad_norm": 0.5341213195324499,
|
|
"learning_rate": 7.188418046158996e-08,
|
|
"loss": 0.2206,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1261979341506958,
|
|
"step": 4700,
|
|
"valid_targets_mean": 4170.6,
|
|
"valid_targets_min": 622
|
|
},
|
|
{
|
|
"epoch": 6.838662790697675,
|
|
"grad_norm": 0.5077496161516507,
|
|
"learning_rate": 6.587481730318645e-08,
|
|
"loss": 0.2113,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11185050010681152,
|
|
"step": 4705,
|
|
"valid_targets_mean": 4248.8,
|
|
"valid_targets_min": 1089
|
|
},
|
|
{
|
|
"epoch": 6.845930232558139,
|
|
"grad_norm": 0.4752393870528188,
|
|
"learning_rate": 6.012730780320163e-08,
|
|
"loss": 0.2271,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12355662882328033,
|
|
"step": 4710,
|
|
"valid_targets_mean": 5046.0,
|
|
"valid_targets_min": 934
|
|
},
|
|
{
|
|
"epoch": 6.853197674418604,
|
|
"grad_norm": 0.5391686062982739,
|
|
"learning_rate": 5.4641727460631455e-08,
|
|
"loss": 0.2208,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11547373980283737,
|
|
"step": 4715,
|
|
"valid_targets_mean": 3947.9,
|
|
"valid_targets_min": 562
|
|
},
|
|
{
|
|
"epoch": 6.8604651162790695,
|
|
"grad_norm": 0.5353702001037038,
|
|
"learning_rate": 4.941814833377745e-08,
|
|
"loss": 0.2174,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1061892881989479,
|
|
"step": 4720,
|
|
"valid_targets_mean": 3186.4,
|
|
"valid_targets_min": 745
|
|
},
|
|
{
|
|
"epoch": 6.867732558139535,
|
|
"grad_norm": 0.5141334293805976,
|
|
"learning_rate": 4.445663903931419e-08,
|
|
"loss": 0.2141,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.07714653015136719,
|
|
"step": 4725,
|
|
"valid_targets_mean": 3283.6,
|
|
"valid_targets_min": 512
|
|
},
|
|
{
|
|
"epoch": 6.875,
|
|
"grad_norm": 0.6642814032204781,
|
|
"learning_rate": 3.975726475137443e-08,
|
|
"loss": 0.2245,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1309489905834198,
|
|
"step": 4730,
|
|
"valid_targets_mean": 2474.1,
|
|
"valid_targets_min": 522
|
|
},
|
|
{
|
|
"epoch": 6.882267441860465,
|
|
"grad_norm": 0.6511885413405972,
|
|
"learning_rate": 3.5320087200698686e-08,
|
|
"loss": 0.226,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.14132645726203918,
|
|
"step": 4735,
|
|
"valid_targets_mean": 3458.9,
|
|
"valid_targets_min": 672
|
|
},
|
|
{
|
|
"epoch": 6.8895348837209305,
|
|
"grad_norm": 0.635448048551765,
|
|
"learning_rate": 3.114516467383144e-08,
|
|
"loss": 0.2203,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.10060547292232513,
|
|
"step": 4740,
|
|
"valid_targets_mean": 2998.4,
|
|
"valid_targets_min": 520
|
|
},
|
|
{
|
|
"epoch": 6.896802325581396,
|
|
"grad_norm": 0.5539102046278637,
|
|
"learning_rate": 2.7232552012339542e-08,
|
|
"loss": 0.2222,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08430768549442291,
|
|
"step": 4745,
|
|
"valid_targets_mean": 2591.6,
|
|
"valid_targets_min": 300
|
|
},
|
|
{
|
|
"epoch": 6.904069767441861,
|
|
"grad_norm": 0.48564974306250575,
|
|
"learning_rate": 2.358230061210387e-08,
|
|
"loss": 0.2166,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12091777473688126,
|
|
"step": 4750,
|
|
"valid_targets_mean": 4487.0,
|
|
"valid_targets_min": 1123
|
|
},
|
|
{
|
|
"epoch": 6.911337209302325,
|
|
"grad_norm": 0.486240918272119,
|
|
"learning_rate": 2.0194458422646557e-08,
|
|
"loss": 0.2075,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09467769414186478,
|
|
"step": 4755,
|
|
"valid_targets_mean": 3418.2,
|
|
"valid_targets_min": 744
|
|
},
|
|
{
|
|
"epoch": 6.9186046511627906,
|
|
"grad_norm": 0.5006300347186905,
|
|
"learning_rate": 1.706906994648705e-08,
|
|
"loss": 0.2144,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11444921046495438,
|
|
"step": 4760,
|
|
"valid_targets_mean": 4181.8,
|
|
"valid_targets_min": 673
|
|
},
|
|
{
|
|
"epoch": 6.925872093023256,
|
|
"grad_norm": 0.5326767776519343,
|
|
"learning_rate": 1.4206176238571457e-08,
|
|
"loss": 0.2132,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09992027282714844,
|
|
"step": 4765,
|
|
"valid_targets_mean": 3968.4,
|
|
"valid_targets_min": 807
|
|
},
|
|
{
|
|
"epoch": 6.933139534883721,
|
|
"grad_norm": 0.6524069067054485,
|
|
"learning_rate": 1.160581490572632e-08,
|
|
"loss": 0.2348,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1270563006401062,
|
|
"step": 4770,
|
|
"valid_targets_mean": 3597.4,
|
|
"valid_targets_min": 778
|
|
},
|
|
{
|
|
"epoch": 6.940406976744186,
|
|
"grad_norm": 0.5455272591274605,
|
|
"learning_rate": 9.268020106167896e-09,
|
|
"loss": 0.2142,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09810951352119446,
|
|
"step": 4775,
|
|
"valid_targets_mean": 3681.2,
|
|
"valid_targets_min": 599
|
|
},
|
|
{
|
|
"epoch": 6.9476744186046515,
|
|
"grad_norm": 0.5273676324333582,
|
|
"learning_rate": 7.192822549046963e-09,
|
|
"loss": 0.2155,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.11775662750005722,
|
|
"step": 4780,
|
|
"valid_targets_mean": 4525.5,
|
|
"valid_targets_min": 634
|
|
},
|
|
{
|
|
"epoch": 6.954941860465116,
|
|
"grad_norm": 0.5131194731831497,
|
|
"learning_rate": 5.38024949405358e-09,
|
|
"loss": 0.2268,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09795769304037094,
|
|
"step": 4785,
|
|
"valid_targets_mean": 3921.0,
|
|
"valid_targets_min": 696
|
|
},
|
|
{
|
|
"epoch": 6.962209302325581,
|
|
"grad_norm": 0.5857771734829496,
|
|
"learning_rate": 3.8303247510596e-09,
|
|
"loss": 0.2196,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12851554155349731,
|
|
"step": 4790,
|
|
"valid_targets_mean": 4447.5,
|
|
"valid_targets_min": 1117
|
|
},
|
|
{
|
|
"epoch": 6.969476744186046,
|
|
"grad_norm": 0.5688605253517679,
|
|
"learning_rate": 2.5430686797944803e-09,
|
|
"loss": 0.2158,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09657136350870132,
|
|
"step": 4795,
|
|
"valid_targets_mean": 3530.4,
|
|
"valid_targets_min": 874
|
|
},
|
|
{
|
|
"epoch": 6.976744186046512,
|
|
"grad_norm": 0.6648295757131324,
|
|
"learning_rate": 1.5184981895899342e-09,
|
|
"loss": 0.2137,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.1428152322769165,
|
|
"step": 4800,
|
|
"valid_targets_mean": 3244.0,
|
|
"valid_targets_min": 636
|
|
},
|
|
{
|
|
"epoch": 6.984011627906977,
|
|
"grad_norm": 0.5347563819472954,
|
|
"learning_rate": 7.566267391512228e-10,
|
|
"loss": 0.2238,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.09766152501106262,
|
|
"step": 4805,
|
|
"valid_targets_mean": 3221.5,
|
|
"valid_targets_min": 571
|
|
},
|
|
{
|
|
"epoch": 6.991279069767442,
|
|
"grad_norm": 0.5588348867166488,
|
|
"learning_rate": 2.574643363839613e-10,
|
|
"loss": 0.2351,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.13627320528030396,
|
|
"step": 4810,
|
|
"valid_targets_mean": 3636.0,
|
|
"valid_targets_min": 547
|
|
},
|
|
{
|
|
"epoch": 6.998546511627907,
|
|
"grad_norm": 0.5159770970836671,
|
|
"learning_rate": 2.1017538260892367e-11,
|
|
"loss": 0.2106,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.08966579288244247,
|
|
"step": 4815,
|
|
"valid_targets_mean": 3309.4,
|
|
"valid_targets_min": 567
|
|
},
|
|
{
|
|
"epoch": 7.0,
|
|
"loss_nan_ranks": 0,
|
|
"loss_rank_avg": 0.12460079044103622,
|
|
"step": 4816,
|
|
"total_flos": 2.3699064220633006e+18,
|
|
"train_loss": 0.2668512877930834,
|
|
"train_runtime": 60502.9208,
|
|
"train_samples_per_second": 1.273,
|
|
"train_steps_per_second": 0.08,
|
|
"valid_targets_mean": 4185.4,
|
|
"valid_targets_min": 557
|
|
}
|
|
],
|
|
"logging_steps": 5,
|
|
"max_steps": 4816,
|
|
"num_input_tokens_seen": 0,
|
|
"num_train_epochs": 7,
|
|
"save_steps": 1500,
|
|
"stateful_callbacks": {
|
|
"TrainerControl": {
|
|
"args": {
|
|
"should_epoch_stop": false,
|
|
"should_evaluate": false,
|
|
"should_log": false,
|
|
"should_save": true,
|
|
"should_training_stop": true
|
|
},
|
|
"attributes": {}
|
|
}
|
|
},
|
|
"total_flos": 2.3699064220633006e+18,
|
|
"train_batch_size": 1,
|
|
"trial_name": null,
|
|
"trial_params": null
|
|
}
|