{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 5.0, "eval_steps": 500, "global_step": 3040, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.008228195282501372, "grad_norm": 13.661592714819882, "learning_rate": 5.263157894736843e-07, "loss": 0.9672, "loss_nan_ranks": 0, "loss_rank_avg": 0.33080172538757324, "step": 5, "valid_targets_mean": 8170.6, "valid_targets_min": 3077 }, { "epoch": 0.016456390565002744, "grad_norm": 11.927844187875976, "learning_rate": 1.1842105263157894e-06, "loss": 0.9636, "loss_nan_ranks": 0, "loss_rank_avg": 0.30587294697761536, "step": 10, "valid_targets_mean": 6980.7, "valid_targets_min": 2298 }, { "epoch": 0.024684585847504114, "grad_norm": 6.744886263610615, "learning_rate": 1.8421052631578948e-06, "loss": 0.9073, "loss_nan_ranks": 0, "loss_rank_avg": 0.2631882429122925, "step": 15, "valid_targets_mean": 6148.2, "valid_targets_min": 2167 }, { "epoch": 0.03291278113000549, "grad_norm": 2.892063783530988, "learning_rate": 2.5e-06, "loss": 0.8329, "loss_nan_ranks": 0, "loss_rank_avg": 0.280141681432724, "step": 20, "valid_targets_mean": 7165.8, "valid_targets_min": 2278 }, { "epoch": 0.04114097641250686, "grad_norm": 1.7886922348255612, "learning_rate": 3.157894736842105e-06, "loss": 0.7725, "loss_nan_ranks": 0, "loss_rank_avg": 0.25607916712760925, "step": 25, "valid_targets_mean": 7202.3, "valid_targets_min": 2907 }, { "epoch": 0.04936917169500823, "grad_norm": 1.4610050364093832, "learning_rate": 3.815789473684211e-06, "loss": 0.7477, "loss_nan_ranks": 0, "loss_rank_avg": 0.24936680495738983, "step": 30, "valid_targets_mean": 7477.5, "valid_targets_min": 2714 }, { "epoch": 0.0575973669775096, "grad_norm": 0.9352394471095702, "learning_rate": 4.473684210526316e-06, "loss": 0.7078, "loss_nan_ranks": 0, "loss_rank_avg": 0.23676790297031403, "step": 35, "valid_targets_mean": 7314.0, "valid_targets_min": 2883 }, { "epoch": 0.06582556226001098, "grad_norm": 0.7295427249654216, "learning_rate": 5.131578947368422e-06, "loss": 0.6618, "loss_nan_ranks": 0, "loss_rank_avg": 0.21210411190986633, "step": 40, "valid_targets_mean": 7126.6, "valid_targets_min": 2597 }, { "epoch": 0.07405375754251234, "grad_norm": 0.6133963494588915, "learning_rate": 5.789473684210527e-06, "loss": 0.6337, "loss_nan_ranks": 0, "loss_rank_avg": 0.19923362135887146, "step": 45, "valid_targets_mean": 7369.8, "valid_targets_min": 3375 }, { "epoch": 0.08228195282501372, "grad_norm": 0.4495388936542107, "learning_rate": 6.447368421052632e-06, "loss": 0.5998, "loss_nan_ranks": 0, "loss_rank_avg": 0.19039945304393768, "step": 50, "valid_targets_mean": 7356.4, "valid_targets_min": 2005 }, { "epoch": 0.09051014810751508, "grad_norm": 0.3995911861766218, "learning_rate": 7.1052631578947375e-06, "loss": 0.5558, "loss_nan_ranks": 0, "loss_rank_avg": 0.17436350882053375, "step": 55, "valid_targets_mean": 8719.0, "valid_targets_min": 589 }, { "epoch": 0.09873834339001646, "grad_norm": 0.3499717213397111, "learning_rate": 7.763157894736843e-06, "loss": 0.5219, "loss_nan_ranks": 0, "loss_rank_avg": 0.18273428082466125, "step": 60, "valid_targets_mean": 9029.5, "valid_targets_min": 4655 }, { "epoch": 0.10696653867251783, "grad_norm": 0.26109198291101654, "learning_rate": 8.421052631578948e-06, "loss": 0.4966, "loss_nan_ranks": 0, "loss_rank_avg": 0.16715273261070251, "step": 65, "valid_targets_mean": 10019.8, "valid_targets_min": 4996 }, { "epoch": 0.1151947339550192, "grad_norm": 0.24495980513506116, "learning_rate": 9.078947368421054e-06, "loss": 0.4791, "loss_nan_ranks": 0, "loss_rank_avg": 0.15863889455795288, "step": 70, "valid_targets_mean": 9413.2, "valid_targets_min": 3337 }, { "epoch": 0.12342292923752057, "grad_norm": 0.27613600523015236, "learning_rate": 9.736842105263159e-06, "loss": 0.4742, "loss_nan_ranks": 0, "loss_rank_avg": 0.16512612998485565, "step": 75, "valid_targets_mean": 10127.1, "valid_targets_min": 3360 }, { "epoch": 0.13165112452002195, "grad_norm": 0.22054068931113005, "learning_rate": 1.0394736842105264e-05, "loss": 0.4552, "loss_nan_ranks": 0, "loss_rank_avg": 0.16071820259094238, "step": 80, "valid_targets_mean": 9319.1, "valid_targets_min": 685 }, { "epoch": 0.1398793198025233, "grad_norm": 0.2616751014414881, "learning_rate": 1.105263157894737e-05, "loss": 0.4578, "loss_nan_ranks": 0, "loss_rank_avg": 0.15120165050029755, "step": 85, "valid_targets_mean": 9109.9, "valid_targets_min": 4379 }, { "epoch": 0.14810751508502468, "grad_norm": 0.25389258411623156, "learning_rate": 1.1710526315789475e-05, "loss": 0.443, "loss_nan_ranks": 0, "loss_rank_avg": 0.14307349920272827, "step": 90, "valid_targets_mean": 9313.2, "valid_targets_min": 3452 }, { "epoch": 0.15633571036752605, "grad_norm": 0.25388019851426047, "learning_rate": 1.236842105263158e-05, "loss": 0.4362, "loss_nan_ranks": 0, "loss_rank_avg": 0.14230628311634064, "step": 95, "valid_targets_mean": 8640.9, "valid_targets_min": 383 }, { "epoch": 0.16456390565002743, "grad_norm": 0.2405595523038858, "learning_rate": 1.3026315789473684e-05, "loss": 0.4342, "loss_nan_ranks": 0, "loss_rank_avg": 0.14278680086135864, "step": 100, "valid_targets_mean": 9029.9, "valid_targets_min": 4552 }, { "epoch": 0.1727921009325288, "grad_norm": 0.22176898805086837, "learning_rate": 1.3684210526315791e-05, "loss": 0.4262, "loss_nan_ranks": 0, "loss_rank_avg": 0.14409483969211578, "step": 105, "valid_targets_mean": 10390.2, "valid_targets_min": 4833 }, { "epoch": 0.18102029621503016, "grad_norm": 0.243090924751181, "learning_rate": 1.4342105263157895e-05, "loss": 0.4172, "loss_nan_ranks": 0, "loss_rank_avg": 0.1436709314584732, "step": 110, "valid_targets_mean": 9771.6, "valid_targets_min": 3641 }, { "epoch": 0.18924849149753153, "grad_norm": 0.2625711173343529, "learning_rate": 1.5000000000000002e-05, "loss": 0.4153, "loss_nan_ranks": 0, "loss_rank_avg": 0.1286260485649109, "step": 115, "valid_targets_mean": 9316.0, "valid_targets_min": 1929 }, { "epoch": 0.1974766867800329, "grad_norm": 0.22939426799124796, "learning_rate": 1.5657894736842107e-05, "loss": 0.4154, "loss_nan_ranks": 0, "loss_rank_avg": 0.13896283507347107, "step": 120, "valid_targets_mean": 9838.7, "valid_targets_min": 4324 }, { "epoch": 0.2057048820625343, "grad_norm": 0.24963282482796506, "learning_rate": 1.6315789473684213e-05, "loss": 0.4208, "loss_nan_ranks": 0, "loss_rank_avg": 0.14296197891235352, "step": 125, "valid_targets_mean": 9693.1, "valid_targets_min": 3811 }, { "epoch": 0.21393307734503567, "grad_norm": 0.30535130323003906, "learning_rate": 1.6973684210526318e-05, "loss": 0.4063, "loss_nan_ranks": 0, "loss_rank_avg": 0.12299084663391113, "step": 130, "valid_targets_mean": 9686.9, "valid_targets_min": 3338 }, { "epoch": 0.22216127262753702, "grad_norm": 0.284400177589226, "learning_rate": 1.763157894736842e-05, "loss": 0.3964, "loss_nan_ranks": 0, "loss_rank_avg": 0.123782217502594, "step": 135, "valid_targets_mean": 9590.6, "valid_targets_min": 4785 }, { "epoch": 0.2303894679100384, "grad_norm": 0.23276724546182528, "learning_rate": 1.828947368421053e-05, "loss": 0.3988, "loss_nan_ranks": 0, "loss_rank_avg": 0.14101338386535645, "step": 140, "valid_targets_mean": 10718.9, "valid_targets_min": 4892 }, { "epoch": 0.23861766319253977, "grad_norm": 0.26025681943282925, "learning_rate": 1.894736842105263e-05, "loss": 0.4023, "loss_nan_ranks": 0, "loss_rank_avg": 0.1524072289466858, "step": 145, "valid_targets_mean": 10753.2, "valid_targets_min": 3836 }, { "epoch": 0.24684585847504115, "grad_norm": 0.2358512322697237, "learning_rate": 1.960526315789474e-05, "loss": 0.3961, "loss_nan_ranks": 0, "loss_rank_avg": 0.11710461974143982, "step": 150, "valid_targets_mean": 8877.9, "valid_targets_min": 424 }, { "epoch": 0.2550740537575425, "grad_norm": 0.23568354731119345, "learning_rate": 2.0263157894736842e-05, "loss": 0.3967, "loss_nan_ranks": 0, "loss_rank_avg": 0.14156289398670197, "step": 155, "valid_targets_mean": 11518.0, "valid_targets_min": 4504 }, { "epoch": 0.2633022490400439, "grad_norm": 0.26669374560220394, "learning_rate": 2.0921052631578947e-05, "loss": 0.3946, "loss_nan_ranks": 0, "loss_rank_avg": 0.14294372498989105, "step": 160, "valid_targets_mean": 10316.1, "valid_targets_min": 4842 }, { "epoch": 0.27153044432254525, "grad_norm": 0.24067166137023635, "learning_rate": 2.1578947368421056e-05, "loss": 0.3925, "loss_nan_ranks": 0, "loss_rank_avg": 0.1319475769996643, "step": 165, "valid_targets_mean": 10630.5, "valid_targets_min": 5085 }, { "epoch": 0.2797586396050466, "grad_norm": 0.24772975734231953, "learning_rate": 2.223684210526316e-05, "loss": 0.3894, "loss_nan_ranks": 0, "loss_rank_avg": 0.14050891995429993, "step": 170, "valid_targets_mean": 10322.6, "valid_targets_min": 4928 }, { "epoch": 0.287986834887548, "grad_norm": 0.278650053623802, "learning_rate": 2.2894736842105263e-05, "loss": 0.3853, "loss_nan_ranks": 0, "loss_rank_avg": 0.13519951701164246, "step": 175, "valid_targets_mean": 10297.2, "valid_targets_min": 3888 }, { "epoch": 0.29621503017004935, "grad_norm": 0.2589128123009836, "learning_rate": 2.355263157894737e-05, "loss": 0.3841, "loss_nan_ranks": 0, "loss_rank_avg": 0.12493768334388733, "step": 180, "valid_targets_mean": 8726.7, "valid_targets_min": 265 }, { "epoch": 0.30444322545255076, "grad_norm": 0.29125365436187955, "learning_rate": 2.4210526315789474e-05, "loss": 0.3787, "loss_nan_ranks": 0, "loss_rank_avg": 0.11316806077957153, "step": 185, "valid_targets_mean": 8473.2, "valid_targets_min": 3703 }, { "epoch": 0.3126714207350521, "grad_norm": 0.2553461910788868, "learning_rate": 2.4868421052631583e-05, "loss": 0.3812, "loss_nan_ranks": 0, "loss_rank_avg": 0.12836065888404846, "step": 190, "valid_targets_mean": 10562.8, "valid_targets_min": 4059 }, { "epoch": 0.32089961601755346, "grad_norm": 0.33557598477032663, "learning_rate": 2.5526315789473688e-05, "loss": 0.4022, "loss_nan_ranks": 0, "loss_rank_avg": 0.13181576132774353, "step": 195, "valid_targets_mean": 5732.4, "valid_targets_min": 996 }, { "epoch": 0.32912781130005486, "grad_norm": 0.34352411636418323, "learning_rate": 2.618421052631579e-05, "loss": 0.418, "loss_nan_ranks": 0, "loss_rank_avg": 0.13641154766082764, "step": 200, "valid_targets_mean": 5909.7, "valid_targets_min": 322 }, { "epoch": 0.3373560065825562, "grad_norm": 3.4954428619882982, "learning_rate": 2.6842105263157896e-05, "loss": 0.6654, "loss_nan_ranks": 0, "loss_rank_avg": 0.34785598516464233, "step": 205, "valid_targets_mean": 3622.3, "valid_targets_min": 1417 }, { "epoch": 0.3455842018650576, "grad_norm": 1.077861726475296, "learning_rate": 2.75e-05, "loss": 0.8938, "loss_nan_ranks": 0, "loss_rank_avg": 0.3038213849067688, "step": 210, "valid_targets_mean": 4234.8, "valid_targets_min": 1229 }, { "epoch": 0.35381239714755897, "grad_norm": 0.5677105395157203, "learning_rate": 2.815789473684211e-05, "loss": 0.7774, "loss_nan_ranks": 0, "loss_rank_avg": 0.18273773789405823, "step": 215, "valid_targets_mean": 3496.8, "valid_targets_min": 792 }, { "epoch": 0.3620405924300603, "grad_norm": 0.44846475537880953, "learning_rate": 2.8815789473684215e-05, "loss": 0.8285, "loss_nan_ranks": 0, "loss_rank_avg": 0.2714836001396179, "step": 220, "valid_targets_mean": 4790.7, "valid_targets_min": 1423 }, { "epoch": 0.3702687877125617, "grad_norm": 0.3456686765451588, "learning_rate": 2.9473684210526317e-05, "loss": 0.7522, "loss_nan_ranks": 0, "loss_rank_avg": 0.28811782598495483, "step": 225, "valid_targets_mean": 4529.3, "valid_targets_min": 1236 }, { "epoch": 0.37849698299506307, "grad_norm": 0.37556290856776664, "learning_rate": 3.0131578947368423e-05, "loss": 0.7109, "loss_nan_ranks": 0, "loss_rank_avg": 0.21670036017894745, "step": 230, "valid_targets_mean": 3307.1, "valid_targets_min": 1399 }, { "epoch": 0.3867251782775645, "grad_norm": 0.33500865716540523, "learning_rate": 3.078947368421053e-05, "loss": 0.718, "loss_nan_ranks": 0, "loss_rank_avg": 0.23109467327594757, "step": 235, "valid_targets_mean": 4017.8, "valid_targets_min": 1176 }, { "epoch": 0.3949533735600658, "grad_norm": 0.31598383847429745, "learning_rate": 3.144736842105264e-05, "loss": 0.6864, "loss_nan_ranks": 0, "loss_rank_avg": 0.14081542193889618, "step": 240, "valid_targets_mean": 1564.6, "valid_targets_min": 635 }, { "epoch": 0.4031815688425672, "grad_norm": 0.3067298171268501, "learning_rate": 3.210526315789474e-05, "loss": 0.704, "loss_nan_ranks": 0, "loss_rank_avg": 0.23977398872375488, "step": 245, "valid_targets_mean": 4694.7, "valid_targets_min": 1910 }, { "epoch": 0.4114097641250686, "grad_norm": 0.34304197183917, "learning_rate": 3.276315789473684e-05, "loss": 0.6787, "loss_nan_ranks": 0, "loss_rank_avg": 0.2708185315132141, "step": 250, "valid_targets_mean": 4543.5, "valid_targets_min": 712 }, { "epoch": 0.4196379594075699, "grad_norm": 0.3757101087371721, "learning_rate": 3.342105263157895e-05, "loss": 0.6624, "loss_nan_ranks": 0, "loss_rank_avg": 0.23688086867332458, "step": 255, "valid_targets_mean": 3509.4, "valid_targets_min": 1442 }, { "epoch": 0.42786615469007133, "grad_norm": 0.3090407246266453, "learning_rate": 3.407894736842106e-05, "loss": 0.6722, "loss_nan_ranks": 0, "loss_rank_avg": 0.1637752205133438, "step": 260, "valid_targets_mean": 3599.4, "valid_targets_min": 328 }, { "epoch": 0.4360943499725727, "grad_norm": 0.33923285458485086, "learning_rate": 3.473684210526316e-05, "loss": 0.635, "loss_nan_ranks": 0, "loss_rank_avg": 0.11224784702062607, "step": 265, "valid_targets_mean": 980.5, "valid_targets_min": 475 }, { "epoch": 0.44432254525507403, "grad_norm": 0.3392379658417928, "learning_rate": 3.539473684210526e-05, "loss": 0.6713, "loss_nan_ranks": 0, "loss_rank_avg": 0.24215322732925415, "step": 270, "valid_targets_mean": 4849.9, "valid_targets_min": 1243 }, { "epoch": 0.45255074053757544, "grad_norm": 0.3150618515035599, "learning_rate": 3.605263157894737e-05, "loss": 0.6483, "loss_nan_ranks": 0, "loss_rank_avg": 0.2192254364490509, "step": 275, "valid_targets_mean": 4380.0, "valid_targets_min": 1142 }, { "epoch": 0.4607789358200768, "grad_norm": 0.3472360677625879, "learning_rate": 3.671052631578948e-05, "loss": 0.6846, "loss_nan_ranks": 0, "loss_rank_avg": 0.2536545991897583, "step": 280, "valid_targets_mean": 3904.7, "valid_targets_min": 1187 }, { "epoch": 0.4690071311025782, "grad_norm": 0.3156614973458573, "learning_rate": 3.736842105263158e-05, "loss": 0.6585, "loss_nan_ranks": 0, "loss_rank_avg": 0.1983037143945694, "step": 285, "valid_targets_mean": 3962.2, "valid_targets_min": 1010 }, { "epoch": 0.47723532638507954, "grad_norm": 0.37742389790153924, "learning_rate": 3.802631578947369e-05, "loss": 0.6333, "loss_nan_ranks": 0, "loss_rank_avg": 0.1320263296365738, "step": 290, "valid_targets_mean": 1099.3, "valid_targets_min": 280 }, { "epoch": 0.4854635216675809, "grad_norm": 0.2962337727307249, "learning_rate": 3.868421052631579e-05, "loss": 0.6569, "loss_nan_ranks": 0, "loss_rank_avg": 0.246580570936203, "step": 295, "valid_targets_mean": 5050.1, "valid_targets_min": 1178 }, { "epoch": 0.4936917169500823, "grad_norm": 0.2856275355602754, "learning_rate": 3.9342105263157895e-05, "loss": 0.6432, "loss_nan_ranks": 0, "loss_rank_avg": 0.2303171455860138, "step": 300, "valid_targets_mean": 5151.1, "valid_targets_min": 1346 }, { "epoch": 0.5019199122325837, "grad_norm": 0.33300122404573673, "learning_rate": 4e-05, "loss": 0.4498, "loss_nan_ranks": 0, "loss_rank_avg": 0.08987970650196075, "step": 305, "valid_targets_mean": 5515.5, "valid_targets_min": 1936 }, { "epoch": 0.510148107515085, "grad_norm": 0.29692627282197165, "learning_rate": 3.999967038544942e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.07394493371248245, "step": 310, "valid_targets_mean": 5127.6, "valid_targets_min": 2180 }, { "epoch": 0.5183763027975864, "grad_norm": 0.25936222317294383, "learning_rate": 3.9998681552662254e-05, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.06937037408351898, "step": 315, "valid_targets_mean": 5021.8, "valid_targets_min": 2808 }, { "epoch": 0.5266044980800878, "grad_norm": 0.3327155662385847, "learning_rate": 3.999703353423185e-05, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.072842076420784, "step": 320, "valid_targets_mean": 5327.4, "valid_targets_min": 2771 }, { "epoch": 0.5348326933625891, "grad_norm": 0.2504539380850954, "learning_rate": 3.999472638447933e-05, "loss": 0.2143, "loss_nan_ranks": 0, "loss_rank_avg": 0.07985015213489532, "step": 325, "valid_targets_mean": 5568.0, "valid_targets_min": 3219 }, { "epoch": 0.5430608886450905, "grad_norm": 0.2814701429958317, "learning_rate": 3.999176017945168e-05, "loss": 0.2107, "loss_nan_ranks": 0, "loss_rank_avg": 0.06997586786746979, "step": 330, "valid_targets_mean": 5279.6, "valid_targets_min": 3339 }, { "epoch": 0.5512890839275919, "grad_norm": 0.23889431711323486, "learning_rate": 3.998813501691934e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.06921573728322983, "step": 335, "valid_targets_mean": 5462.8, "valid_targets_min": 1825 }, { "epoch": 0.5595172792100932, "grad_norm": 0.2620420014965469, "learning_rate": 3.9983851016372945e-05, "loss": 0.2049, "loss_nan_ranks": 0, "loss_rank_avg": 0.06677880883216858, "step": 340, "valid_targets_mean": 5447.9, "valid_targets_min": 2456 }, { "epoch": 0.5677454744925946, "grad_norm": 0.2222928848241994, "learning_rate": 3.997890831901938e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.06969676911830902, "step": 345, "valid_targets_mean": 5365.3, "valid_targets_min": 2902 }, { "epoch": 0.575973669775096, "grad_norm": 0.24107676881576715, "learning_rate": 3.997330708777714e-05, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.06276493519544601, "step": 350, "valid_targets_mean": 4987.0, "valid_targets_min": 3287 }, { "epoch": 0.5842018650575974, "grad_norm": 0.21062109587656125, "learning_rate": 3.996704750727097e-05, "loss": 0.197, "loss_nan_ranks": 0, "loss_rank_avg": 0.05960414931178093, "step": 355, "valid_targets_mean": 5047.8, "valid_targets_min": 2252 }, { "epoch": 0.5924300603400987, "grad_norm": 0.2165529180549222, "learning_rate": 3.9960129783825746e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.07164271175861359, "step": 360, "valid_targets_mean": 5323.9, "valid_targets_min": 2401 }, { "epoch": 0.6006582556226001, "grad_norm": 0.2602414889343082, "learning_rate": 3.995255414545969e-05, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.06296073645353317, "step": 365, "valid_targets_mean": 5421.0, "valid_targets_min": 916 }, { "epoch": 0.6088864509051015, "grad_norm": 0.22113365838524923, "learning_rate": 3.994432084187688e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.05878105387091637, "step": 370, "valid_targets_mean": 5157.3, "valid_targets_min": 2787 }, { "epoch": 0.6171146461876028, "grad_norm": 0.2726984781426435, "learning_rate": 3.993543014445897e-05, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.06641367077827454, "step": 375, "valid_targets_mean": 5285.9, "valid_targets_min": 2725 }, { "epoch": 0.6253428414701042, "grad_norm": 0.24103613454295666, "learning_rate": 3.992588234625629e-05, "loss": 0.1943, "loss_nan_ranks": 0, "loss_rank_avg": 0.06343524158000946, "step": 380, "valid_targets_mean": 4471.1, "valid_targets_min": 773 }, { "epoch": 0.6335710367526056, "grad_norm": 0.23661985213609446, "learning_rate": 3.991567776197815e-05, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.06470175087451935, "step": 385, "valid_targets_mean": 5323.2, "valid_targets_min": 3113 }, { "epoch": 0.6417992320351069, "grad_norm": 0.2365355448830919, "learning_rate": 3.990481672798251e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.06568753719329834, "step": 390, "valid_targets_mean": 5507.8, "valid_targets_min": 3054 }, { "epoch": 0.6500274273176083, "grad_norm": 0.250970116784741, "learning_rate": 3.989329960226486e-05, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.06060680001974106, "step": 395, "valid_targets_mean": 5065.1, "valid_targets_min": 2739 }, { "epoch": 0.6582556226001097, "grad_norm": 0.24890957035716, "learning_rate": 3.988112676444639e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.06493669748306274, "step": 400, "valid_targets_mean": 5267.3, "valid_targets_min": 3285 }, { "epoch": 0.6664838178826111, "grad_norm": 0.2123920671176028, "learning_rate": 3.9868298615761586e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.06611112505197525, "step": 405, "valid_targets_mean": 5350.7, "valid_targets_min": 2809 }, { "epoch": 0.6747120131651124, "grad_norm": 0.45669439712276166, "learning_rate": 3.9854815579044866e-05, "loss": 0.5087, "loss_nan_ranks": 0, "loss_rank_avg": 0.1900215744972229, "step": 410, "valid_targets_mean": 4092.8, "valid_targets_min": 1262 }, { "epoch": 0.6829402084476138, "grad_norm": 0.34680859400827757, "learning_rate": 3.984067809871675e-05, "loss": 0.5508, "loss_nan_ranks": 0, "loss_rank_avg": 0.1873103380203247, "step": 415, "valid_targets_mean": 3959.6, "valid_targets_min": 922 }, { "epoch": 0.6911684037301152, "grad_norm": 0.33789768611131743, "learning_rate": 3.982588664076916e-05, "loss": 0.5498, "loss_nan_ranks": 0, "loss_rank_avg": 0.172877237200737, "step": 420, "valid_targets_mean": 3500.9, "valid_targets_min": 1193 }, { "epoch": 0.6993965990126165, "grad_norm": 0.3422411868231782, "learning_rate": 3.981044169275006e-05, "loss": 0.5395, "loss_nan_ranks": 0, "loss_rank_avg": 0.16920597851276398, "step": 425, "valid_targets_mean": 3293.8, "valid_targets_min": 1211 }, { "epoch": 0.7076247942951179, "grad_norm": 0.2819763328446606, "learning_rate": 3.979434376374744e-05, "loss": 0.5325, "loss_nan_ranks": 0, "loss_rank_avg": 0.19173139333724976, "step": 430, "valid_targets_mean": 4374.8, "valid_targets_min": 1271 }, { "epoch": 0.7158529895776193, "grad_norm": 0.3302657868370585, "learning_rate": 3.9777593384372436e-05, "loss": 0.5511, "loss_nan_ranks": 0, "loss_rank_avg": 0.15441164374351501, "step": 435, "valid_targets_mean": 2742.0, "valid_targets_min": 1163 }, { "epoch": 0.7240811848601206, "grad_norm": 0.36559426634652425, "learning_rate": 3.9760191106741935e-05, "loss": 0.525, "loss_nan_ranks": 0, "loss_rank_avg": 0.17873308062553406, "step": 440, "valid_targets_mean": 2944.6, "valid_targets_min": 747 }, { "epoch": 0.732309380142622, "grad_norm": 0.29776253451819223, "learning_rate": 3.9742137504460326e-05, "loss": 0.4966, "loss_nan_ranks": 0, "loss_rank_avg": 0.09976305067539215, "step": 445, "valid_targets_mean": 1390.7, "valid_targets_min": 617 }, { "epoch": 0.7405375754251234, "grad_norm": 0.2741654148501185, "learning_rate": 3.972343317260061e-05, "loss": 0.556, "loss_nan_ranks": 0, "loss_rank_avg": 0.20187368988990784, "step": 450, "valid_targets_mean": 5282.3, "valid_targets_min": 1416 }, { "epoch": 0.7487657707076248, "grad_norm": 0.29327103026837464, "learning_rate": 3.970407872768478e-05, "loss": 0.5153, "loss_nan_ranks": 0, "loss_rank_avg": 0.21182456612586975, "step": 455, "valid_targets_mean": 5102.7, "valid_targets_min": 635 }, { "epoch": 0.7569939659901261, "grad_norm": 0.3027137360580798, "learning_rate": 3.968407480766352e-05, "loss": 0.5377, "loss_nan_ranks": 0, "loss_rank_avg": 0.17653965950012207, "step": 460, "valid_targets_mean": 4471.8, "valid_targets_min": 1166 }, { "epoch": 0.7652221612726275, "grad_norm": 0.3131357916514081, "learning_rate": 3.9663422071895103e-05, "loss": 0.5099, "loss_nan_ranks": 0, "loss_rank_avg": 0.1851877123117447, "step": 465, "valid_targets_mean": 3015.3, "valid_targets_min": 644 }, { "epoch": 0.773450356555129, "grad_norm": 0.30585055011385276, "learning_rate": 3.964212120112379e-05, "loss": 0.5066, "loss_nan_ranks": 0, "loss_rank_avg": 0.16202497482299805, "step": 470, "valid_targets_mean": 4168.5, "valid_targets_min": 1159 }, { "epoch": 0.7816785518376302, "grad_norm": 0.3185891945520371, "learning_rate": 3.962017289745724e-05, "loss": 0.5529, "loss_nan_ranks": 0, "loss_rank_avg": 0.18970099091529846, "step": 475, "valid_targets_mean": 4139.7, "valid_targets_min": 1171 }, { "epoch": 0.7899067471201316, "grad_norm": 0.3193022031463681, "learning_rate": 3.959757788434351e-05, "loss": 0.5281, "loss_nan_ranks": 0, "loss_rank_avg": 0.1599006950855255, "step": 480, "valid_targets_mean": 3524.7, "valid_targets_min": 706 }, { "epoch": 0.798134942402633, "grad_norm": 0.47454037589519754, "learning_rate": 3.957433690654709e-05, "loss": 0.5262, "loss_nan_ranks": 0, "loss_rank_avg": 0.13566067814826965, "step": 485, "valid_targets_mean": 974.1, "valid_targets_min": 373 }, { "epoch": 0.8063631376851343, "grad_norm": 0.27137258308574463, "learning_rate": 3.955045073012443e-05, "loss": 0.5126, "loss_nan_ranks": 0, "loss_rank_avg": 0.1551508903503418, "step": 490, "valid_targets_mean": 4034.9, "valid_targets_min": 1413 }, { "epoch": 0.8145913329676358, "grad_norm": 0.2891185235274737, "learning_rate": 3.952592014239867e-05, "loss": 0.5201, "loss_nan_ranks": 0, "loss_rank_avg": 0.18325182795524597, "step": 495, "valid_targets_mean": 4597.8, "valid_targets_min": 1386 }, { "epoch": 0.8228195282501372, "grad_norm": 0.30627166767474445, "learning_rate": 3.950074595193366e-05, "loss": 0.5038, "loss_nan_ranks": 0, "loss_rank_avg": 0.14900541305541992, "step": 500, "valid_targets_mean": 3344.0, "valid_targets_min": 1074 }, { "epoch": 0.8310477235326386, "grad_norm": 0.2910945730347226, "learning_rate": 3.947492898850736e-05, "loss": 0.5297, "loss_nan_ranks": 0, "loss_rank_avg": 0.2500567138195038, "step": 505, "valid_targets_mean": 4781.9, "valid_targets_min": 1038 }, { "epoch": 0.8392759188151399, "grad_norm": 0.28859181669258777, "learning_rate": 3.9448470103084436e-05, "loss": 0.5061, "loss_nan_ranks": 0, "loss_rank_avg": 0.14351779222488403, "step": 510, "valid_targets_mean": 4052.2, "valid_targets_min": 1148 }, { "epoch": 0.8475041140976413, "grad_norm": 0.2849202691210404, "learning_rate": 3.942137016778826e-05, "loss": 0.4405, "loss_nan_ranks": 0, "loss_rank_avg": 0.09605582058429718, "step": 515, "valid_targets_mean": 5513.2, "valid_targets_min": 260 }, { "epoch": 0.8557323093801427, "grad_norm": 0.24873959226778644, "learning_rate": 3.939363007587213e-05, "loss": 0.3552, "loss_nan_ranks": 0, "loss_rank_avg": 0.1327248215675354, "step": 520, "valid_targets_mean": 6674.3, "valid_targets_min": 667 }, { "epoch": 0.863960504662644, "grad_norm": 0.2519692215563831, "learning_rate": 3.9365250741689835e-05, "loss": 0.3647, "loss_nan_ranks": 0, "loss_rank_avg": 0.11264800280332565, "step": 525, "valid_targets_mean": 5004.6, "valid_targets_min": 184 }, { "epoch": 0.8721886999451454, "grad_norm": 0.2342060171912288, "learning_rate": 3.933623310066554e-05, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.11143757402896881, "step": 530, "valid_targets_mean": 6059.3, "valid_targets_min": 496 }, { "epoch": 0.8804168952276468, "grad_norm": 0.271362287684106, "learning_rate": 3.9306578109262894e-05, "loss": 0.347, "loss_nan_ranks": 0, "loss_rank_avg": 0.05567864701151848, "step": 535, "valid_targets_mean": 1604.8, "valid_targets_min": 520 }, { "epoch": 0.8886450905101481, "grad_norm": 0.2597578802375837, "learning_rate": 3.927628674495357e-05, "loss": 0.3431, "loss_nan_ranks": 0, "loss_rank_avg": 0.09169554710388184, "step": 540, "valid_targets_mean": 6672.8, "valid_targets_min": 750 }, { "epoch": 0.8968732857926495, "grad_norm": 0.21749824898637793, "learning_rate": 3.924536000618501e-05, "loss": 0.3249, "loss_nan_ranks": 0, "loss_rank_avg": 0.10265297442674637, "step": 545, "valid_targets_mean": 5849.8, "valid_targets_min": 225 }, { "epoch": 0.9051014810751509, "grad_norm": 0.2241552515651752, "learning_rate": 3.921379891234753e-05, "loss": 0.3254, "loss_nan_ranks": 0, "loss_rank_avg": 0.11423005163669586, "step": 550, "valid_targets_mean": 6783.3, "valid_targets_min": 643 }, { "epoch": 0.9133296763576523, "grad_norm": 0.2158340366537389, "learning_rate": 3.9181604503740714e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.09704571962356567, "step": 555, "valid_targets_mean": 6440.8, "valid_targets_min": 392 }, { "epoch": 0.9215578716401536, "grad_norm": 0.26183611514857996, "learning_rate": 3.914877784153909e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.17041084170341492, "step": 560, "valid_targets_mean": 8714.9, "valid_targets_min": 1646 }, { "epoch": 0.929786066922655, "grad_norm": 0.20432961383680928, "learning_rate": 3.9115320007757225e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.0803799033164978, "step": 565, "valid_targets_mean": 6242.6, "valid_targets_min": 1338 }, { "epoch": 0.9380142622051564, "grad_norm": 0.2092825817868237, "learning_rate": 3.9081232105214e-05, "loss": 0.3229, "loss_nan_ranks": 0, "loss_rank_avg": 0.13302992284297943, "step": 570, "valid_targets_mean": 7600.2, "valid_targets_min": 399 }, { "epoch": 0.9462424574876577, "grad_norm": 0.19714866749443535, "learning_rate": 3.9046515257496295e-05, "loss": 0.3387, "loss_nan_ranks": 0, "loss_rank_avg": 0.0796457827091217, "step": 575, "valid_targets_mean": 6031.7, "valid_targets_min": 993 }, { "epoch": 0.9544706527701591, "grad_norm": 0.20932629070373632, "learning_rate": 3.9011170608921904e-05, "loss": 0.295, "loss_nan_ranks": 0, "loss_rank_avg": 0.09574976563453674, "step": 580, "valid_targets_mean": 6480.3, "valid_targets_min": 279 }, { "epoch": 0.9626988480526605, "grad_norm": 0.19884348922834869, "learning_rate": 3.897519932450189e-05, "loss": 0.3276, "loss_nan_ranks": 0, "loss_rank_avg": 0.08668152987957001, "step": 585, "valid_targets_mean": 6095.1, "valid_targets_min": 1420 }, { "epoch": 0.9709270433351618, "grad_norm": 0.1916490209833201, "learning_rate": 3.893860258990212e-05, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.09876567125320435, "step": 590, "valid_targets_mean": 6487.8, "valid_targets_min": 491 }, { "epoch": 0.9791552386176632, "grad_norm": 0.24087156746724506, "learning_rate": 3.890138161140421e-05, "loss": 0.2973, "loss_nan_ranks": 0, "loss_rank_avg": 0.08016130328178406, "step": 595, "valid_targets_mean": 1157.9, "valid_targets_min": 493 }, { "epoch": 0.9873834339001646, "grad_norm": 0.21112403994094667, "learning_rate": 3.886353761586579e-05, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.10186732560396194, "step": 600, "valid_targets_mean": 6671.6, "valid_targets_min": 354 }, { "epoch": 0.9956116291826659, "grad_norm": 0.20983694665510674, "learning_rate": 3.8825071850679996e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.12147838622331619, "step": 605, "valid_targets_mean": 7020.9, "valid_targets_min": 848 }, { "epoch": 1.0032912781130006, "grad_norm": 1.659397044858526, "learning_rate": 3.878598558373443e-05, "loss": 0.5467, "loss_nan_ranks": 0, "loss_rank_avg": 0.18808016180992126, "step": 610, "valid_targets_mean": 6370.5, "valid_targets_min": 2089 }, { "epoch": 1.011519473395502, "grad_norm": 0.7209332976643361, "learning_rate": 3.874628010336932e-05, "loss": 0.5739, "loss_nan_ranks": 0, "loss_rank_avg": 0.20240893959999084, "step": 615, "valid_targets_mean": 7651.2, "valid_targets_min": 2581 }, { "epoch": 1.0197476686780034, "grad_norm": 0.4882521280358526, "learning_rate": 3.870595671833508e-05, "loss": 0.5011, "loss_nan_ranks": 0, "loss_rank_avg": 0.16959220170974731, "step": 620, "valid_targets_mean": 7917.3, "valid_targets_min": 2931 }, { "epoch": 1.0279758639605046, "grad_norm": 0.3524983441886274, "learning_rate": 3.866501675774914e-05, "loss": 0.4729, "loss_nan_ranks": 0, "loss_rank_avg": 0.16359078884124756, "step": 625, "valid_targets_mean": 7465.7, "valid_targets_min": 1655 }, { "epoch": 1.036204059243006, "grad_norm": 0.285845283172002, "learning_rate": 3.862346157105219e-05, "loss": 0.444, "loss_nan_ranks": 0, "loss_rank_avg": 0.13884960114955902, "step": 630, "valid_targets_mean": 6986.5, "valid_targets_min": 2745 }, { "epoch": 1.0444322545255074, "grad_norm": 0.2637082715943371, "learning_rate": 3.858129252796363e-05, "loss": 0.4377, "loss_nan_ranks": 0, "loss_rank_avg": 0.12356004118919373, "step": 635, "valid_targets_mean": 6226.8, "valid_targets_min": 2078 }, { "epoch": 1.0526604498080088, "grad_norm": 0.28887382496755204, "learning_rate": 3.853851101843649e-05, "loss": 0.4291, "loss_nan_ranks": 0, "loss_rank_avg": 0.12742659449577332, "step": 640, "valid_targets_mean": 6504.0, "valid_targets_min": 3466 }, { "epoch": 1.0608886450905102, "grad_norm": 0.24476017136685832, "learning_rate": 3.8495118452611574e-05, "loss": 0.4201, "loss_nan_ranks": 0, "loss_rank_avg": 0.14294564723968506, "step": 645, "valid_targets_mean": 7776.8, "valid_targets_min": 2749 }, { "epoch": 1.0691168403730116, "grad_norm": 0.2726802244958609, "learning_rate": 3.845111626077097e-05, "loss": 0.4119, "loss_nan_ranks": 0, "loss_rank_avg": 0.12050601094961166, "step": 650, "valid_targets_mean": 6354.8, "valid_targets_min": 1941 }, { "epoch": 1.077345035655513, "grad_norm": 0.2773725725381812, "learning_rate": 3.840650589329098e-05, "loss": 0.4111, "loss_nan_ranks": 0, "loss_rank_avg": 0.1138051226735115, "step": 655, "valid_targets_mean": 6384.4, "valid_targets_min": 2441 }, { "epoch": 1.0855732309380142, "grad_norm": 0.26559994898000056, "learning_rate": 3.83612888205942e-05, "loss": 0.4077, "loss_nan_ranks": 0, "loss_rank_avg": 0.13822872936725616, "step": 660, "valid_targets_mean": 7465.9, "valid_targets_min": 2228 }, { "epoch": 1.0938014262205156, "grad_norm": 0.22208110131792275, "learning_rate": 3.8315466533101154e-05, "loss": 0.3852, "loss_nan_ranks": 0, "loss_rank_avg": 0.11882581561803818, "step": 665, "valid_targets_mean": 8703.7, "valid_targets_min": 4392 }, { "epoch": 1.102029621503017, "grad_norm": 0.21922616622876517, "learning_rate": 3.82690405411811e-05, "loss": 0.3758, "loss_nan_ranks": 0, "loss_rank_avg": 0.11796137690544128, "step": 670, "valid_targets_mean": 9525.9, "valid_targets_min": 3807 }, { "epoch": 1.1102578167855184, "grad_norm": 0.2335012875150806, "learning_rate": 3.82220123751023e-05, "loss": 0.3727, "loss_nan_ranks": 0, "loss_rank_avg": 0.12342832237482071, "step": 675, "valid_targets_mean": 8976.7, "valid_targets_min": 2713 }, { "epoch": 1.1184860120680198, "grad_norm": 0.20615998005456446, "learning_rate": 3.8174383584981525e-05, "loss": 0.3683, "loss_nan_ranks": 0, "loss_rank_avg": 0.12510226666927338, "step": 680, "valid_targets_mean": 9808.0, "valid_targets_min": 5333 }, { "epoch": 1.1267142073505212, "grad_norm": 0.20549746954269069, "learning_rate": 3.812615574073301e-05, "loss": 0.3675, "loss_nan_ranks": 0, "loss_rank_avg": 0.11540381610393524, "step": 685, "valid_targets_mean": 8583.8, "valid_targets_min": 2662 }, { "epoch": 1.1349424026330226, "grad_norm": 0.354746331129916, "learning_rate": 3.807733043201666e-05, "loss": 0.3624, "loss_nan_ranks": 0, "loss_rank_avg": 0.11764580011367798, "step": 690, "valid_targets_mean": 8976.7, "valid_targets_min": 899 }, { "epoch": 1.1431705979155238, "grad_norm": 0.22026383511742792, "learning_rate": 3.8027909268185695e-05, "loss": 0.3701, "loss_nan_ranks": 0, "loss_rank_avg": 0.1217566654086113, "step": 695, "valid_targets_mean": 8862.6, "valid_targets_min": 363 }, { "epoch": 1.1513987931980252, "grad_norm": 0.24232587865327862, "learning_rate": 3.7977893878233604e-05, "loss": 0.3592, "loss_nan_ranks": 0, "loss_rank_avg": 0.12140684574842453, "step": 700, "valid_targets_mean": 9068.4, "valid_targets_min": 532 }, { "epoch": 1.1596269884805266, "grad_norm": 0.21509299959913547, "learning_rate": 3.792728591074041e-05, "loss": 0.3619, "loss_nan_ranks": 0, "loss_rank_avg": 0.12871021032333374, "step": 705, "valid_targets_mean": 10089.5, "valid_targets_min": 5419 }, { "epoch": 1.167855183763028, "grad_norm": 0.231174997822983, "learning_rate": 3.7876087033818345e-05, "loss": 0.3584, "loss_nan_ranks": 0, "loss_rank_avg": 0.11500117927789688, "step": 710, "valid_targets_mean": 9003.8, "valid_targets_min": 387 }, { "epoch": 1.1760833790455294, "grad_norm": 0.22555157163732995, "learning_rate": 3.78242989350569e-05, "loss": 0.3579, "loss_nan_ranks": 0, "loss_rank_avg": 0.12305817008018494, "step": 715, "valid_targets_mean": 10012.9, "valid_targets_min": 5197 }, { "epoch": 1.1843115743280308, "grad_norm": 0.23487162908677478, "learning_rate": 3.7771923321467163e-05, "loss": 0.3555, "loss_nan_ranks": 0, "loss_rank_avg": 0.12105908989906311, "step": 720, "valid_targets_mean": 9826.7, "valid_targets_min": 464 }, { "epoch": 1.1925397696105322, "grad_norm": 0.2517013646791283, "learning_rate": 3.771896191942556e-05, "loss": 0.3526, "loss_nan_ranks": 0, "loss_rank_avg": 0.10659809410572052, "step": 725, "valid_targets_mean": 8842.1, "valid_targets_min": 4239 }, { "epoch": 1.2007679648930334, "grad_norm": 0.2156644331644718, "learning_rate": 3.7665416474616986e-05, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.10782045125961304, "step": 730, "valid_targets_mean": 9048.3, "valid_targets_min": 5085 }, { "epoch": 1.2089961601755348, "grad_norm": 0.26346428818115725, "learning_rate": 3.761128875197719e-05, "loss": 0.362, "loss_nan_ranks": 0, "loss_rank_avg": 0.11525176465511322, "step": 735, "valid_targets_mean": 9484.0, "valid_targets_min": 4512 }, { "epoch": 1.2172243554580362, "grad_norm": 0.22755907847000245, "learning_rate": 3.7556580535634685e-05, "loss": 0.3485, "loss_nan_ranks": 0, "loss_rank_avg": 0.11937953531742096, "step": 740, "valid_targets_mean": 9844.3, "valid_targets_min": 3863 }, { "epoch": 1.2254525507405376, "grad_norm": 0.22714801320069883, "learning_rate": 3.750129362885188e-05, "loss": 0.3469, "loss_nan_ranks": 0, "loss_rank_avg": 0.10537885129451752, "step": 745, "valid_targets_mean": 9963.1, "valid_targets_min": 5225 }, { "epoch": 1.233680746023039, "grad_norm": 0.2147068269485451, "learning_rate": 3.744542985396566e-05, "loss": 0.3486, "loss_nan_ranks": 0, "loss_rank_avg": 0.10538201034069061, "step": 750, "valid_targets_mean": 9133.7, "valid_targets_min": 2782 }, { "epoch": 1.2419089413055404, "grad_norm": 0.22999817220649277, "learning_rate": 3.738899105232734e-05, "loss": 0.3524, "loss_nan_ranks": 0, "loss_rank_avg": 0.12429474294185638, "step": 755, "valid_targets_mean": 9841.2, "valid_targets_min": 885 }, { "epoch": 1.2501371365880418, "grad_norm": 0.2182279465433469, "learning_rate": 3.733197908424194e-05, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.10498598963022232, "step": 760, "valid_targets_mean": 9260.1, "valid_targets_min": 378 }, { "epoch": 1.258365331870543, "grad_norm": 0.2176991000254134, "learning_rate": 3.727439582890689e-05, "loss": 0.3521, "loss_nan_ranks": 0, "loss_rank_avg": 0.11775383353233337, "step": 765, "valid_targets_mean": 9212.2, "valid_targets_min": 3467 }, { "epoch": 1.2665935271530444, "grad_norm": 0.22474069393548862, "learning_rate": 3.721624318435006e-05, "loss": 0.3442, "loss_nan_ranks": 0, "loss_rank_avg": 0.11866054683923721, "step": 770, "valid_targets_mean": 10565.9, "valid_targets_min": 723 }, { "epoch": 1.2748217224355458, "grad_norm": 0.3553450372737768, "learning_rate": 3.715752306736724e-05, "loss": 0.3491, "loss_nan_ranks": 0, "loss_rank_avg": 0.11934887617826462, "step": 775, "valid_targets_mean": 10235.8, "valid_targets_min": 5141 }, { "epoch": 1.2830499177180472, "grad_norm": 0.24117058830790514, "learning_rate": 3.709823741345894e-05, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.12090543657541275, "step": 780, "valid_targets_mean": 10594.5, "valid_targets_min": 4701 }, { "epoch": 1.2912781130005486, "grad_norm": 0.27672367825987276, "learning_rate": 3.703838817676654e-05, "loss": 0.3399, "loss_nan_ranks": 0, "loss_rank_avg": 0.1089012622833252, "step": 785, "valid_targets_mean": 9161.7, "valid_targets_min": 3022 }, { "epoch": 1.2995063082830498, "grad_norm": 0.21099639116289254, "learning_rate": 3.6977977330008e-05, "loss": 0.3432, "loss_nan_ranks": 0, "loss_rank_avg": 0.1100674569606781, "step": 790, "valid_targets_mean": 9593.7, "valid_targets_min": 5120 }, { "epoch": 1.3077345035655512, "grad_norm": 0.27202881396330664, "learning_rate": 3.691700686441272e-05, "loss": 0.3365, "loss_nan_ranks": 0, "loss_rank_avg": 0.10544559359550476, "step": 795, "valid_targets_mean": 9896.2, "valid_targets_min": 3759 }, { "epoch": 1.3159626988480526, "grad_norm": 0.29008227740554365, "learning_rate": 3.685547878965595e-05, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.11258372664451599, "step": 800, "valid_targets_mean": 9676.5, "valid_targets_min": 4171 }, { "epoch": 1.324190894130554, "grad_norm": 0.2648068230573467, "learning_rate": 3.679339513379257e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.11481667309999466, "step": 805, "valid_targets_mean": 6269.3, "valid_targets_min": 470 }, { "epoch": 1.3324190894130554, "grad_norm": 0.3302755564975962, "learning_rate": 3.673075794319022e-05, "loss": 0.3703, "loss_nan_ranks": 0, "loss_rank_avg": 0.1273985505104065, "step": 810, "valid_targets_mean": 6197.9, "valid_targets_min": 350 }, { "epoch": 1.3406472846955568, "grad_norm": 0.9946048795797314, "learning_rate": 3.6667569282461835e-05, "loss": 0.7179, "loss_nan_ranks": 0, "loss_rank_avg": 0.29462897777557373, "step": 815, "valid_targets_mean": 5028.6, "valid_targets_min": 935 }, { "epoch": 1.3488754799780582, "grad_norm": 0.5672650836141364, "learning_rate": 3.660383123439761e-05, "loss": 0.6726, "loss_nan_ranks": 0, "loss_rank_avg": 0.1995016634464264, "step": 820, "valid_targets_mean": 3933.0, "valid_targets_min": 797 }, { "epoch": 1.3571036752605594, "grad_norm": 0.42579660991027274, "learning_rate": 3.653954589989637e-05, "loss": 0.6596, "loss_nan_ranks": 0, "loss_rank_avg": 0.18716245889663696, "step": 825, "valid_targets_mean": 3912.4, "valid_targets_min": 1137 }, { "epoch": 1.3653318705430608, "grad_norm": 0.30342608710540986, "learning_rate": 3.647471539789626e-05, "loss": 0.6193, "loss_nan_ranks": 0, "loss_rank_avg": 0.2176496684551239, "step": 830, "valid_targets_mean": 3427.5, "valid_targets_min": 570 }, { "epoch": 1.3735600658255622, "grad_norm": 0.2692438365384602, "learning_rate": 3.640934186530496e-05, "loss": 0.612, "loss_nan_ranks": 0, "loss_rank_avg": 0.17222759127616882, "step": 835, "valid_targets_mean": 4285.9, "valid_targets_min": 1385 }, { "epoch": 1.3817882611080636, "grad_norm": 0.3252340214730497, "learning_rate": 3.634342745692924e-05, "loss": 0.6096, "loss_nan_ranks": 0, "loss_rank_avg": 0.23037424683570862, "step": 840, "valid_targets_mean": 4571.2, "valid_targets_min": 1195 }, { "epoch": 1.390016456390565, "grad_norm": 0.283339399288758, "learning_rate": 3.62769743454039e-05, "loss": 0.5952, "loss_nan_ranks": 0, "loss_rank_avg": 0.17118248343467712, "step": 845, "valid_targets_mean": 3360.0, "valid_targets_min": 791 }, { "epoch": 1.3982446516730664, "grad_norm": 0.2935408435366708, "learning_rate": 3.6209984721120195e-05, "loss": 0.6073, "loss_nan_ranks": 0, "loss_rank_avg": 0.18600332736968994, "step": 850, "valid_targets_mean": 3748.8, "valid_targets_min": 1312 }, { "epoch": 1.4064728469555678, "grad_norm": 0.2785551163427506, "learning_rate": 3.614246079215361e-05, "loss": 0.5841, "loss_nan_ranks": 0, "loss_rank_avg": 0.2570624053478241, "step": 855, "valid_targets_mean": 4315.9, "valid_targets_min": 858 }, { "epoch": 1.414701042238069, "grad_norm": 0.2571094312626162, "learning_rate": 3.6074404784191084e-05, "loss": 0.5723, "loss_nan_ranks": 0, "loss_rank_avg": 0.2021176815032959, "step": 860, "valid_targets_mean": 5165.7, "valid_targets_min": 1332 }, { "epoch": 1.4229292375205704, "grad_norm": 0.29270135824966964, "learning_rate": 3.600581894045768e-05, "loss": 0.5871, "loss_nan_ranks": 0, "loss_rank_avg": 0.17256325483322144, "step": 865, "valid_targets_mean": 4124.3, "valid_targets_min": 1668 }, { "epoch": 1.4311574328030718, "grad_norm": 0.2943443689190457, "learning_rate": 3.593670552164261e-05, "loss": 0.5814, "loss_nan_ranks": 0, "loss_rank_avg": 0.19908928871154785, "step": 870, "valid_targets_mean": 4181.1, "valid_targets_min": 897 }, { "epoch": 1.4393856280855732, "grad_norm": 0.30602158217934583, "learning_rate": 3.586706680582471e-05, "loss": 0.5616, "loss_nan_ranks": 0, "loss_rank_avg": 0.17146259546279907, "step": 875, "valid_targets_mean": 3683.8, "valid_targets_min": 1300 }, { "epoch": 1.4476138233680746, "grad_norm": 0.2818001970674873, "learning_rate": 3.579690508839738e-05, "loss": 0.5933, "loss_nan_ranks": 0, "loss_rank_avg": 0.2810094952583313, "step": 880, "valid_targets_mean": 4964.7, "valid_targets_min": 906 }, { "epoch": 1.455842018650576, "grad_norm": 0.26338390068846385, "learning_rate": 3.572622268199292e-05, "loss": 0.5654, "loss_nan_ranks": 0, "loss_rank_avg": 0.1930113285779953, "step": 885, "valid_targets_mean": 4663.9, "valid_targets_min": 1014 }, { "epoch": 1.4640702139330775, "grad_norm": 0.2852703233091329, "learning_rate": 3.5655021916406295e-05, "loss": 0.6099, "loss_nan_ranks": 0, "loss_rank_avg": 0.20813152194023132, "step": 890, "valid_targets_mean": 5404.8, "valid_targets_min": 1229 }, { "epoch": 1.4722984092155786, "grad_norm": 0.28634164602408574, "learning_rate": 3.558330513851833e-05, "loss": 0.5761, "loss_nan_ranks": 0, "loss_rank_avg": 0.18061956763267517, "step": 895, "valid_targets_mean": 4281.5, "valid_targets_min": 1057 }, { "epoch": 1.48052660449808, "grad_norm": 0.3363155802523227, "learning_rate": 3.55110747122184e-05, "loss": 0.5784, "loss_nan_ranks": 0, "loss_rank_avg": 0.21961042284965515, "step": 900, "valid_targets_mean": 4570.4, "valid_targets_min": 1376 }, { "epoch": 1.4887547997805815, "grad_norm": 0.3152139088458827, "learning_rate": 3.543833301832642e-05, "loss": 0.591, "loss_nan_ranks": 0, "loss_rank_avg": 0.21911880373954773, "step": 905, "valid_targets_mean": 4505.6, "valid_targets_min": 1222 }, { "epoch": 1.4969829950630829, "grad_norm": 0.2725299656670677, "learning_rate": 3.5365082454514493e-05, "loss": 0.5635, "loss_nan_ranks": 0, "loss_rank_avg": 0.155883327126503, "step": 910, "valid_targets_mean": 4379.0, "valid_targets_min": 558 }, { "epoch": 1.5052111903455843, "grad_norm": 0.3099063769029409, "learning_rate": 3.529132543522777e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.062484048306941986, "step": 915, "valid_targets_mean": 5018.2, "valid_targets_min": 2523 }, { "epoch": 1.5134393856280854, "grad_norm": 0.24229893596824933, "learning_rate": 3.521706439160494e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.05739575996994972, "step": 920, "valid_targets_mean": 5262.3, "valid_targets_min": 2967 }, { "epoch": 1.521667580910587, "grad_norm": 0.22759412709293747, "learning_rate": 3.514230177139805e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.05191062390804291, "step": 925, "valid_targets_mean": 5112.8, "valid_targets_min": 3095 }, { "epoch": 1.5298957761930883, "grad_norm": 0.2099880413854461, "learning_rate": 3.5067040038891834e-05, "loss": 0.174, "loss_nan_ranks": 0, "loss_rank_avg": 0.054002054035663605, "step": 930, "valid_targets_mean": 5352.1, "valid_targets_min": 2034 }, { "epoch": 1.5381239714755897, "grad_norm": 0.211986257010731, "learning_rate": 3.499128167482253e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.059163033962249756, "step": 935, "valid_targets_mean": 5610.1, "valid_targets_min": 3069 }, { "epoch": 1.546352166758091, "grad_norm": 0.20019735272394734, "learning_rate": 3.491502917629602e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.05470460653305054, "step": 940, "valid_targets_mean": 5206.3, "valid_targets_min": 3294 }, { "epoch": 1.5545803620405925, "grad_norm": 0.22719278970124465, "learning_rate": 3.483828505670563e-05, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.05662545561790466, "step": 945, "valid_targets_mean": 5573.9, "valid_targets_min": 1997 }, { "epoch": 1.5628085573230939, "grad_norm": 0.20264846243090592, "learning_rate": 3.476105184564921e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.05749613046646118, "step": 950, "valid_targets_mean": 5469.3, "valid_targets_min": 3506 }, { "epoch": 1.571036752605595, "grad_norm": 0.19906120158231985, "learning_rate": 3.468333208884576e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.056417644023895264, "step": 955, "valid_targets_mean": 5436.2, "valid_targets_min": 2886 }, { "epoch": 1.5792649478880967, "grad_norm": 0.21488228662363817, "learning_rate": 3.4605128348051566e-05, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.06093878298997879, "step": 960, "valid_targets_mean": 5540.5, "valid_targets_min": 3229 }, { "epoch": 1.5874931431705979, "grad_norm": 0.20141714461992172, "learning_rate": 3.4526443200975704e-05, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.057458825409412384, "step": 965, "valid_targets_mean": 5831.1, "valid_targets_min": 2745 }, { "epoch": 1.5957213384530993, "grad_norm": 0.19477058216940663, "learning_rate": 3.444727924119511e-05, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.05204876884818077, "step": 970, "valid_targets_mean": 5347.5, "valid_targets_min": 2417 }, { "epoch": 1.6039495337356007, "grad_norm": 0.22865468044098994, "learning_rate": 3.436763907806911e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.053488366305828094, "step": 975, "valid_targets_mean": 5258.5, "valid_targets_min": 720 }, { "epoch": 1.612177729018102, "grad_norm": 0.22074279987171683, "learning_rate": 3.4287525336653335e-05, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.052560918033123016, "step": 980, "valid_targets_mean": 5099.8, "valid_targets_min": 1583 }, { "epoch": 1.6204059243006035, "grad_norm": 0.17850347287453902, "learning_rate": 3.420694065761328e-05, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.05743696168065071, "step": 985, "valid_targets_mean": 5578.4, "valid_targets_min": 2798 }, { "epoch": 1.6286341195831047, "grad_norm": 0.19214912575505724, "learning_rate": 3.412588769713723e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.050386179238557816, "step": 990, "valid_targets_mean": 5036.6, "valid_targets_min": 2310 }, { "epoch": 1.6368623148656063, "grad_norm": 0.19389336692541487, "learning_rate": 3.40443691268487e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.053170040249824524, "step": 995, "valid_targets_mean": 5270.8, "valid_targets_min": 2978 }, { "epoch": 1.6450905101481075, "grad_norm": 0.21103448932645819, "learning_rate": 3.396238763371837e-05, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.05385826528072357, "step": 1000, "valid_targets_mean": 5462.3, "valid_targets_min": 2571 }, { "epoch": 1.6533187054306089, "grad_norm": 0.20655305153916342, "learning_rate": 3.387994591997554e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.050711266696453094, "step": 1005, "valid_targets_mean": 5422.2, "valid_targets_min": 2689 }, { "epoch": 1.6615469007131103, "grad_norm": 0.20405599334414792, "learning_rate": 3.379704670301906e-05, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.05435357242822647, "step": 1010, "valid_targets_mean": 5195.3, "valid_targets_min": 3110 }, { "epoch": 1.6697750959956115, "grad_norm": 0.8352584687550971, "learning_rate": 3.371369271532775e-05, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.19201651215553284, "step": 1015, "valid_targets_mean": 3959.7, "valid_targets_min": 1023 }, { "epoch": 1.678003291278113, "grad_norm": 0.5025769864208273, "learning_rate": 3.362988670437031e-05, "loss": 0.4966, "loss_nan_ranks": 0, "loss_rank_avg": 0.14757052063941956, "step": 1020, "valid_targets_mean": 3057.9, "valid_targets_min": 1066 }, { "epoch": 1.6862314865606143, "grad_norm": 0.3026403609768399, "learning_rate": 3.354563143251483e-05, "loss": 0.4843, "loss_nan_ranks": 0, "loss_rank_avg": 0.1374441534280777, "step": 1025, "valid_targets_mean": 4226.2, "valid_targets_min": 902 }, { "epoch": 1.694459681843116, "grad_norm": 0.3072152435136929, "learning_rate": 3.346092967693764e-05, "loss": 0.4969, "loss_nan_ranks": 0, "loss_rank_avg": 0.14073555171489716, "step": 1030, "valid_targets_mean": 3537.5, "valid_targets_min": 1090 }, { "epoch": 1.702687877125617, "grad_norm": 0.31412887585449273, "learning_rate": 3.3375784229531864e-05, "loss": 0.4868, "loss_nan_ranks": 0, "loss_rank_avg": 0.13491514325141907, "step": 1035, "valid_targets_mean": 3058.2, "valid_targets_min": 771 }, { "epoch": 1.7109160724081185, "grad_norm": 0.36543147309442925, "learning_rate": 3.3290197896815344e-05, "loss": 0.4708, "loss_nan_ranks": 0, "loss_rank_avg": 0.15971092879772186, "step": 1040, "valid_targets_mean": 1120.0, "valid_targets_min": 521 }, { "epoch": 1.71914426769062, "grad_norm": 0.26724180927424696, "learning_rate": 3.320417349983813e-05, "loss": 0.4831, "loss_nan_ranks": 0, "loss_rank_avg": 0.16630011796951294, "step": 1045, "valid_targets_mean": 4731.8, "valid_targets_min": 1389 }, { "epoch": 1.727372462973121, "grad_norm": 0.24730868974709785, "learning_rate": 3.3117713874089516e-05, "loss": 0.455, "loss_nan_ranks": 0, "loss_rank_avg": 0.1551167070865631, "step": 1050, "valid_targets_mean": 4816.6, "valid_targets_min": 1341 }, { "epoch": 1.7356006582556227, "grad_norm": 0.28605184203121603, "learning_rate": 3.303082186940458e-05, "loss": 0.4822, "loss_nan_ranks": 0, "loss_rank_avg": 0.14953917264938354, "step": 1055, "valid_targets_mean": 3374.7, "valid_targets_min": 1239 }, { "epoch": 1.743828853538124, "grad_norm": 0.2673582874164761, "learning_rate": 3.294350034987022e-05, "loss": 0.4692, "loss_nan_ranks": 0, "loss_rank_avg": 0.16546636819839478, "step": 1060, "valid_targets_mean": 3214.4, "valid_targets_min": 621 }, { "epoch": 1.7520570488206253, "grad_norm": 0.2633944966457584, "learning_rate": 3.285575219373079e-05, "loss": 0.4608, "loss_nan_ranks": 0, "loss_rank_avg": 0.17115873098373413, "step": 1065, "valid_targets_mean": 5321.0, "valid_targets_min": 1407 }, { "epoch": 1.7602852441031267, "grad_norm": 0.28138662960460287, "learning_rate": 3.276758029329318e-05, "loss": 0.482, "loss_nan_ranks": 0, "loss_rank_avg": 0.1477651447057724, "step": 1070, "valid_targets_mean": 3536.7, "valid_targets_min": 915 }, { "epoch": 1.768513439385628, "grad_norm": 0.30575007256496134, "learning_rate": 3.267898755483153e-05, "loss": 0.4575, "loss_nan_ranks": 0, "loss_rank_avg": 0.12381979823112488, "step": 1075, "valid_targets_mean": 2772.1, "valid_targets_min": 1106 }, { "epoch": 1.7767416346681295, "grad_norm": 0.4606810569188011, "learning_rate": 3.258997689849142e-05, "loss": 0.4827, "loss_nan_ranks": 0, "loss_rank_avg": 0.29282310605049133, "step": 1080, "valid_targets_mean": 3487.8, "valid_targets_min": 523 }, { "epoch": 1.7849698299506307, "grad_norm": 0.27883070137062055, "learning_rate": 3.250055125819358e-05, "loss": 0.4813, "loss_nan_ranks": 0, "loss_rank_avg": 0.14349916577339172, "step": 1085, "valid_targets_mean": 4307.9, "valid_targets_min": 1207 }, { "epoch": 1.7931980252331323, "grad_norm": 0.2848599685713568, "learning_rate": 3.241071358153723e-05, "loss": 0.4659, "loss_nan_ranks": 0, "loss_rank_avg": 0.17098680138587952, "step": 1090, "valid_targets_mean": 4449.8, "valid_targets_min": 1036 }, { "epoch": 1.8014262205156335, "grad_norm": 0.30529896453924493, "learning_rate": 3.232046682970293e-05, "loss": 0.4793, "loss_nan_ranks": 0, "loss_rank_avg": 0.13532951474189758, "step": 1095, "valid_targets_mean": 3510.9, "valid_targets_min": 1014 }, { "epoch": 1.809654415798135, "grad_norm": 0.28169285171294794, "learning_rate": 3.2229813977354926e-05, "loss": 0.4687, "loss_nan_ranks": 0, "loss_rank_avg": 0.16980434954166412, "step": 1100, "valid_targets_mean": 4310.5, "valid_targets_min": 1193 }, { "epoch": 1.8178826110806363, "grad_norm": 0.26956538256356954, "learning_rate": 3.213875801254314e-05, "loss": 0.4568, "loss_nan_ranks": 0, "loss_rank_avg": 0.13664710521697998, "step": 1105, "valid_targets_mean": 4566.1, "valid_targets_min": 1394 }, { "epoch": 1.8261108063631377, "grad_norm": 0.32339359248442834, "learning_rate": 3.204730193660466e-05, "loss": 0.4743, "loss_nan_ranks": 0, "loss_rank_avg": 0.1973041146993637, "step": 1110, "valid_targets_mean": 3325.2, "valid_targets_min": 883 }, { "epoch": 1.8343390016456391, "grad_norm": 0.3143153411480853, "learning_rate": 3.195544876406482e-05, "loss": 0.4771, "loss_nan_ranks": 0, "loss_rank_avg": 0.16181105375289917, "step": 1115, "valid_targets_mean": 3990.3, "valid_targets_min": 1374 }, { "epoch": 1.8425671969281403, "grad_norm": 0.4224508251606666, "learning_rate": 3.1863201522537843e-05, "loss": 0.4355, "loss_nan_ranks": 0, "loss_rank_avg": 0.143344908952713, "step": 1120, "valid_targets_mean": 5897.4, "valid_targets_min": 347 }, { "epoch": 1.850795392210642, "grad_norm": 0.278768311774877, "learning_rate": 3.177056325262704e-05, "loss": 0.3117, "loss_nan_ranks": 0, "loss_rank_avg": 0.09472917020320892, "step": 1125, "valid_targets_mean": 6455.6, "valid_targets_min": 1359 }, { "epoch": 1.8590235874931431, "grad_norm": 0.22708249957012502, "learning_rate": 3.167753700782457e-05, "loss": 0.281, "loss_nan_ranks": 0, "loss_rank_avg": 0.097655288875103, "step": 1130, "valid_targets_mean": 6676.2, "valid_targets_min": 1143 }, { "epoch": 1.8672517827756445, "grad_norm": 0.22955456223919352, "learning_rate": 3.1584125854410824e-05, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.11995258927345276, "step": 1135, "valid_targets_mean": 6722.4, "valid_targets_min": 505 }, { "epoch": 1.875479978058146, "grad_norm": 0.18939517331373842, "learning_rate": 3.149033287135335e-05, "loss": 0.2902, "loss_nan_ranks": 0, "loss_rank_avg": 0.10605036467313766, "step": 1140, "valid_targets_mean": 7329.8, "valid_targets_min": 1300 }, { "epoch": 1.8837081733406473, "grad_norm": 0.21555429419147118, "learning_rate": 3.1396161150205324e-05, "loss": 0.3081, "loss_nan_ranks": 0, "loss_rank_avg": 0.07604040205478668, "step": 1145, "valid_targets_mean": 6100.7, "valid_targets_min": 1328 }, { "epoch": 1.8919363686231487, "grad_norm": 0.18721522620193756, "learning_rate": 3.130161379500371e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.06492835283279419, "step": 1150, "valid_targets_mean": 5562.0, "valid_targets_min": 246 }, { "epoch": 1.90016456390565, "grad_norm": 0.6559450509008863, "learning_rate": 3.120669392216692e-05, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.06112710386514664, "step": 1155, "valid_targets_mean": 1929.8, "valid_targets_min": 503 }, { "epoch": 1.9083927591881515, "grad_norm": 0.19521939318451423, "learning_rate": 3.111140466039205e-05, "loss": 0.2809, "loss_nan_ranks": 0, "loss_rank_avg": 0.0632120668888092, "step": 1160, "valid_targets_mean": 5253.4, "valid_targets_min": 595 }, { "epoch": 1.9166209544706527, "grad_norm": 0.19764156857068718, "learning_rate": 3.1015749150551835e-05, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.07447328418493271, "step": 1165, "valid_targets_mean": 5247.3, "valid_targets_min": 257 }, { "epoch": 1.9248491497531541, "grad_norm": 0.19862374493029875, "learning_rate": 3.091973054559106e-05, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.07149604707956314, "step": 1170, "valid_targets_mean": 5607.3, "valid_targets_min": 452 }, { "epoch": 1.9330773450356555, "grad_norm": 0.2011133107853708, "learning_rate": 3.082335201042266e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.10824010521173477, "step": 1175, "valid_targets_mean": 7863.1, "valid_targets_min": 1340 }, { "epoch": 1.9413055403181567, "grad_norm": 0.23295729957170552, "learning_rate": 3.0726616721823394e-05, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.15341416001319885, "step": 1180, "valid_targets_mean": 7620.9, "valid_targets_min": 1084 }, { "epoch": 1.9495337356006583, "grad_norm": 0.19668525599135733, "learning_rate": 3.062952786832912e-05, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.08159739524126053, "step": 1185, "valid_targets_mean": 5906.8, "valid_targets_min": 1288 }, { "epoch": 1.9577619308831595, "grad_norm": 0.21883749091726576, "learning_rate": 3.053208865012973e-05, "loss": 0.2714, "loss_nan_ranks": 0, "loss_rank_avg": 0.0845392718911171, "step": 1190, "valid_targets_mean": 5153.4, "valid_targets_min": 221 }, { "epoch": 1.9659901261656612, "grad_norm": 0.21677746139321524, "learning_rate": 3.0434302278963623e-05, "loss": 0.2811, "loss_nan_ranks": 0, "loss_rank_avg": 0.10049721598625183, "step": 1195, "valid_targets_mean": 7219.4, "valid_targets_min": 219 }, { "epoch": 1.9742183214481623, "grad_norm": 0.1734827884546814, "learning_rate": 3.0336171978011885e-05, "loss": 0.2645, "loss_nan_ranks": 0, "loss_rank_avg": 0.07478731125593185, "step": 1200, "valid_targets_mean": 5985.7, "valid_targets_min": 292 }, { "epoch": 1.9824465167306637, "grad_norm": 0.19391076236488966, "learning_rate": 3.0237700981792023e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.06688568741083145, "step": 1205, "valid_targets_mean": 5758.3, "valid_targets_min": 310 }, { "epoch": 1.9906747120131651, "grad_norm": 0.1785729712568323, "learning_rate": 3.013889253605135e-05, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.05671679973602295, "step": 1210, "valid_targets_mean": 5599.4, "valid_targets_min": 982 }, { "epoch": 1.9989029072956663, "grad_norm": 0.20992664106258474, "learning_rate": 3.0039749897660005e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.05317822843790054, "step": 1215, "valid_targets_mean": 2148.5, "valid_targets_min": 457 }, { "epoch": 2.006582556226001, "grad_norm": 0.9638756157661459, "learning_rate": 2.9940276334503617e-05, "loss": 0.6179, "loss_nan_ranks": 0, "loss_rank_avg": 0.1680884063243866, "step": 1220, "valid_targets_mean": 6954.8, "valid_targets_min": 1761 }, { "epoch": 2.0148107515085023, "grad_norm": 0.6978276908779179, "learning_rate": 2.984047512537557e-05, "loss": 0.4752, "loss_nan_ranks": 0, "loss_rank_avg": 0.17175118625164032, "step": 1225, "valid_targets_mean": 8220.0, "valid_targets_min": 2842 }, { "epoch": 2.023038946791004, "grad_norm": 0.4316421614618443, "learning_rate": 2.9740349559868918e-05, "loss": 0.4364, "loss_nan_ranks": 0, "loss_rank_avg": 0.13174858689308167, "step": 1230, "valid_targets_mean": 7166.5, "valid_targets_min": 2501 }, { "epoch": 2.031267142073505, "grad_norm": 0.3683054870009327, "learning_rate": 2.9639902938267994e-05, "loss": 0.4043, "loss_nan_ranks": 0, "loss_rank_avg": 0.13023295998573303, "step": 1235, "valid_targets_mean": 6987.4, "valid_targets_min": 1709 }, { "epoch": 2.0394953373560067, "grad_norm": 0.27694022329011136, "learning_rate": 2.9539138571439614e-05, "loss": 0.3873, "loss_nan_ranks": 0, "loss_rank_avg": 0.1342620551586151, "step": 1240, "valid_targets_mean": 7609.8, "valid_targets_min": 2002 }, { "epoch": 2.047723532638508, "grad_norm": 0.2579222382415089, "learning_rate": 2.943805978072391e-05, "loss": 0.3884, "loss_nan_ranks": 0, "loss_rank_avg": 0.12417769432067871, "step": 1245, "valid_targets_mean": 7067.3, "valid_targets_min": 2449 }, { "epoch": 2.055951727921009, "grad_norm": 0.25837969440910324, "learning_rate": 2.933666989782491e-05, "loss": 0.3801, "loss_nan_ranks": 0, "loss_rank_avg": 0.11597777903079987, "step": 1250, "valid_targets_mean": 7091.4, "valid_targets_min": 2861 }, { "epoch": 2.0641799232035107, "grad_norm": 0.2491458862466655, "learning_rate": 2.9234972264700687e-05, "loss": 0.3696, "loss_nan_ranks": 0, "loss_rank_avg": 0.1361021101474762, "step": 1255, "valid_targets_mean": 7742.7, "valid_targets_min": 341 }, { "epoch": 2.072408118486012, "grad_norm": 0.21808961060612198, "learning_rate": 2.913297023345319e-05, "loss": 0.3725, "loss_nan_ranks": 0, "loss_rank_avg": 0.14099043607711792, "step": 1260, "valid_targets_mean": 8509.0, "valid_targets_min": 3043 }, { "epoch": 2.0806363137685135, "grad_norm": 0.22565312170460802, "learning_rate": 2.903066716621779e-05, "loss": 0.3689, "loss_nan_ranks": 0, "loss_rank_avg": 0.11987649649381638, "step": 1265, "valid_targets_mean": 6931.7, "valid_targets_min": 2360 }, { "epoch": 2.0888645090510147, "grad_norm": 0.20315983397248213, "learning_rate": 2.892806643505245e-05, "loss": 0.3582, "loss_nan_ranks": 0, "loss_rank_avg": 0.1136256754398346, "step": 1270, "valid_targets_mean": 9712.0, "valid_targets_min": 2685 }, { "epoch": 2.0970927043335164, "grad_norm": 0.20097162887853337, "learning_rate": 2.8825171421826555e-05, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.11705143749713898, "step": 1275, "valid_targets_mean": 9876.8, "valid_targets_min": 387 }, { "epoch": 2.1053208996160175, "grad_norm": 0.20588709003765224, "learning_rate": 2.8721985518109457e-05, "loss": 0.3355, "loss_nan_ranks": 0, "loss_rank_avg": 0.10917450487613678, "step": 1280, "valid_targets_mean": 9530.9, "valid_targets_min": 5556 }, { "epoch": 2.1135490948985187, "grad_norm": 0.2078925688921669, "learning_rate": 2.861851212505869e-05, "loss": 0.325, "loss_nan_ranks": 0, "loss_rank_avg": 0.11689627170562744, "step": 1285, "valid_targets_mean": 9594.7, "valid_targets_min": 4603 }, { "epoch": 2.1217772901810203, "grad_norm": 0.20054485627408972, "learning_rate": 2.8514754653307836e-05, "loss": 0.3343, "loss_nan_ranks": 0, "loss_rank_avg": 0.11187094449996948, "step": 1290, "valid_targets_mean": 9466.0, "valid_targets_min": 6389 }, { "epoch": 2.1300054854635215, "grad_norm": 0.22534885286504078, "learning_rate": 2.8410716522854152e-05, "loss": 0.3245, "loss_nan_ranks": 0, "loss_rank_avg": 0.10926699638366699, "step": 1295, "valid_targets_mean": 9956.4, "valid_targets_min": 4744 }, { "epoch": 2.138233680746023, "grad_norm": 0.22280970786481757, "learning_rate": 2.8306401162945795e-05, "loss": 0.3325, "loss_nan_ranks": 0, "loss_rank_avg": 0.11518752574920654, "step": 1300, "valid_targets_mean": 9960.5, "valid_targets_min": 6172 }, { "epoch": 2.1464618760285243, "grad_norm": 0.21839411779582002, "learning_rate": 2.8201812011968807e-05, "loss": 0.3282, "loss_nan_ranks": 0, "loss_rank_avg": 0.10992267727851868, "step": 1305, "valid_targets_mean": 9848.8, "valid_targets_min": 751 }, { "epoch": 2.154690071311026, "grad_norm": 0.21794272450141897, "learning_rate": 2.809695251733379e-05, "loss": 0.3265, "loss_nan_ranks": 0, "loss_rank_avg": 0.1086210310459137, "step": 1310, "valid_targets_mean": 9407.0, "valid_targets_min": 2003 }, { "epoch": 2.162918266593527, "grad_norm": 0.2210245319595092, "learning_rate": 2.799182613536226e-05, "loss": 0.3264, "loss_nan_ranks": 0, "loss_rank_avg": 0.10626842081546783, "step": 1315, "valid_targets_mean": 9471.5, "valid_targets_min": 4297 }, { "epoch": 2.1711464618760283, "grad_norm": 0.22990804540391607, "learning_rate": 2.7886436331172745e-05, "loss": 0.3257, "loss_nan_ranks": 0, "loss_rank_avg": 0.10737085342407227, "step": 1320, "valid_targets_mean": 8577.6, "valid_targets_min": 3933 }, { "epoch": 2.17937465715853, "grad_norm": 0.205922355272621, "learning_rate": 2.7780786578566524e-05, "loss": 0.3213, "loss_nan_ranks": 0, "loss_rank_avg": 0.1152525395154953, "step": 1325, "valid_targets_mean": 9960.7, "valid_targets_min": 1490 }, { "epoch": 2.187602852441031, "grad_norm": 0.1876585353072035, "learning_rate": 2.7674880359913183e-05, "loss": 0.3235, "loss_nan_ranks": 0, "loss_rank_avg": 0.10439243167638779, "step": 1330, "valid_targets_mean": 9948.3, "valid_targets_min": 3344 }, { "epoch": 2.1958310477235328, "grad_norm": 0.20859391800680568, "learning_rate": 2.7568721166035778e-05, "loss": 0.3254, "loss_nan_ranks": 0, "loss_rank_avg": 0.09820768982172012, "step": 1335, "valid_targets_mean": 9342.2, "valid_targets_min": 3715 }, { "epoch": 2.204059243006034, "grad_norm": 0.22628943045344366, "learning_rate": 2.7462312496095805e-05, "loss": 0.3337, "loss_nan_ranks": 0, "loss_rank_avg": 0.11237113922834396, "step": 1340, "valid_targets_mean": 9508.4, "valid_targets_min": 434 }, { "epoch": 2.2122874382885356, "grad_norm": 0.20135082037861282, "learning_rate": 2.735565785747787e-05, "loss": 0.3271, "loss_nan_ranks": 0, "loss_rank_avg": 0.10496258735656738, "step": 1345, "valid_targets_mean": 9982.4, "valid_targets_min": 3744 }, { "epoch": 2.2205156335710368, "grad_norm": 0.22074725520877453, "learning_rate": 2.7248760765674033e-05, "loss": 0.3156, "loss_nan_ranks": 0, "loss_rank_avg": 0.10917022824287415, "step": 1350, "valid_targets_mean": 9832.3, "valid_targets_min": 5100 }, { "epoch": 2.228743828853538, "grad_norm": 0.2212465257169665, "learning_rate": 2.7141624744168e-05, "loss": 0.3177, "loss_nan_ranks": 0, "loss_rank_avg": 0.1113644689321518, "step": 1355, "valid_targets_mean": 10835.8, "valid_targets_min": 2829 }, { "epoch": 2.2369720241360396, "grad_norm": 0.19921061855711575, "learning_rate": 2.703425332431891e-05, "loss": 0.3222, "loss_nan_ranks": 0, "loss_rank_avg": 0.10436619818210602, "step": 1360, "valid_targets_mean": 10256.2, "valid_targets_min": 5379 }, { "epoch": 2.2452002194185408, "grad_norm": 0.23316937250636952, "learning_rate": 2.6926650045245014e-05, "loss": 0.3216, "loss_nan_ranks": 0, "loss_rank_avg": 0.09406248480081558, "step": 1365, "valid_targets_mean": 9251.9, "valid_targets_min": 648 }, { "epoch": 2.2534284147010424, "grad_norm": 0.1967403350878879, "learning_rate": 2.6818818453706944e-05, "loss": 0.3191, "loss_nan_ranks": 0, "loss_rank_avg": 0.11360487341880798, "step": 1370, "valid_targets_mean": 11007.1, "valid_targets_min": 1456 }, { "epoch": 2.2616566099835436, "grad_norm": 0.22084889534546884, "learning_rate": 2.6710762103990856e-05, "loss": 0.323, "loss_nan_ranks": 0, "loss_rank_avg": 0.10803453624248505, "step": 1375, "valid_targets_mean": 9657.8, "valid_targets_min": 2733 }, { "epoch": 2.269884805266045, "grad_norm": 0.20093362465257963, "learning_rate": 2.660248455779128e-05, "loss": 0.318, "loss_nan_ranks": 0, "loss_rank_avg": 0.12841132283210754, "step": 1380, "valid_targets_mean": 10753.2, "valid_targets_min": 5581 }, { "epoch": 2.2781130005485464, "grad_norm": 0.20269530317142032, "learning_rate": 2.6493989384093674e-05, "loss": 0.321, "loss_nan_ranks": 0, "loss_rank_avg": 0.10728751868009567, "step": 1385, "valid_targets_mean": 9586.8, "valid_targets_min": 3841 }, { "epoch": 2.2863411958310476, "grad_norm": 0.2946661577910316, "learning_rate": 2.6385280159056838e-05, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.09770511090755463, "step": 1390, "valid_targets_mean": 9004.5, "valid_targets_min": 434 }, { "epoch": 2.294569391113549, "grad_norm": 0.23257347797723024, "learning_rate": 2.6276360465895004e-05, "loss": 0.3172, "loss_nan_ranks": 0, "loss_rank_avg": 0.09528092294931412, "step": 1395, "valid_targets_mean": 9294.9, "valid_targets_min": 4130 }, { "epoch": 2.3027975863960504, "grad_norm": 0.22704053553458559, "learning_rate": 2.6167233894759743e-05, "loss": 0.3109, "loss_nan_ranks": 0, "loss_rank_avg": 0.10657741874456406, "step": 1400, "valid_targets_mean": 10179.0, "valid_targets_min": 4267 }, { "epoch": 2.311025781678552, "grad_norm": 0.21046171710437353, "learning_rate": 2.6057904042621625e-05, "loss": 0.3157, "loss_nan_ranks": 0, "loss_rank_avg": 0.09410691261291504, "step": 1405, "valid_targets_mean": 8532.7, "valid_targets_min": 417 }, { "epoch": 2.319253976961053, "grad_norm": 0.24250405396092567, "learning_rate": 2.5948374513151668e-05, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.12210428714752197, "step": 1410, "valid_targets_mean": 6747.5, "valid_targets_min": 401 }, { "epoch": 2.3274821722435544, "grad_norm": 0.2738588406052067, "learning_rate": 2.583864891660252e-05, "loss": 0.3357, "loss_nan_ranks": 0, "loss_rank_avg": 0.10755414515733719, "step": 1415, "valid_targets_mean": 5423.5, "valid_targets_min": 369 }, { "epoch": 2.335710367526056, "grad_norm": 2.4982151917439483, "learning_rate": 2.5728730869689505e-05, "loss": 0.4375, "loss_nan_ranks": 0, "loss_rank_avg": 0.2848479747772217, "step": 1420, "valid_targets_mean": 3791.8, "valid_targets_min": 1231 }, { "epoch": 2.343938562808557, "grad_norm": 0.6190427970922461, "learning_rate": 2.5618623995471394e-05, "loss": 0.6956, "loss_nan_ranks": 0, "loss_rank_avg": 0.20855411887168884, "step": 1425, "valid_targets_mean": 4159.7, "valid_targets_min": 1267 }, { "epoch": 2.352166758091059, "grad_norm": 0.5754941700932448, "learning_rate": 2.5508331923230963e-05, "loss": 0.6226, "loss_nan_ranks": 0, "loss_rank_avg": 0.1878442019224167, "step": 1430, "valid_targets_mean": 3654.0, "valid_targets_min": 1421 }, { "epoch": 2.36039495337356, "grad_norm": 0.3930300076882507, "learning_rate": 2.5397858288355397e-05, "loss": 0.6106, "loss_nan_ranks": 0, "loss_rank_avg": 0.17351096868515015, "step": 1435, "valid_targets_mean": 2945.1, "valid_targets_min": 996 }, { "epoch": 2.3686231486560616, "grad_norm": 0.32216825686035716, "learning_rate": 2.5287206732216453e-05, "loss": 0.5819, "loss_nan_ranks": 0, "loss_rank_avg": 0.20648203790187836, "step": 1440, "valid_targets_mean": 4179.1, "valid_targets_min": 1183 }, { "epoch": 2.376851343938563, "grad_norm": 0.2956785702719909, "learning_rate": 2.5176380902050418e-05, "loss": 0.5457, "loss_nan_ranks": 0, "loss_rank_avg": 0.17796429991722107, "step": 1445, "valid_targets_mean": 4048.5, "valid_targets_min": 1297 }, { "epoch": 2.3850795392210644, "grad_norm": 0.28597121366642053, "learning_rate": 2.5065384450837916e-05, "loss": 0.5422, "loss_nan_ranks": 0, "loss_rank_avg": 0.17518360912799835, "step": 1450, "valid_targets_mean": 4272.8, "valid_targets_min": 1187 }, { "epoch": 2.3933077345035656, "grad_norm": 0.2921318011955971, "learning_rate": 2.495422103718349e-05, "loss": 0.5542, "loss_nan_ranks": 0, "loss_rank_avg": 0.2636011242866516, "step": 1455, "valid_targets_mean": 4842.6, "valid_targets_min": 1298 }, { "epoch": 2.401535929786067, "grad_norm": 0.28775359794170824, "learning_rate": 2.4842894325194996e-05, "loss": 0.5454, "loss_nan_ranks": 0, "loss_rank_avg": 0.21379245817661285, "step": 1460, "valid_targets_mean": 4255.8, "valid_targets_min": 1314 }, { "epoch": 2.4097641250685684, "grad_norm": 0.27746274584622366, "learning_rate": 2.473140798436285e-05, "loss": 0.5415, "loss_nan_ranks": 0, "loss_rank_avg": 0.16948026418685913, "step": 1465, "valid_targets_mean": 4050.4, "valid_targets_min": 1624 }, { "epoch": 2.4179923203510696, "grad_norm": 0.2809157030625528, "learning_rate": 2.4619765689439064e-05, "loss": 0.5188, "loss_nan_ranks": 0, "loss_rank_avg": 0.16582998633384705, "step": 1470, "valid_targets_mean": 3251.1, "valid_targets_min": 1018 }, { "epoch": 2.426220515633571, "grad_norm": 0.27242860017545745, "learning_rate": 2.4507971120316128e-05, "loss": 0.5321, "loss_nan_ranks": 0, "loss_rank_avg": 0.18139344453811646, "step": 1475, "valid_targets_mean": 3961.1, "valid_targets_min": 1033 }, { "epoch": 2.4344487109160724, "grad_norm": 0.2572967478845345, "learning_rate": 2.4396027961905704e-05, "loss": 0.5298, "loss_nan_ranks": 0, "loss_rank_avg": 0.19407576322555542, "step": 1480, "valid_targets_mean": 5018.0, "valid_targets_min": 1101 }, { "epoch": 2.4426769061985736, "grad_norm": 0.2729508689206608, "learning_rate": 2.4283939904017183e-05, "loss": 0.5344, "loss_nan_ranks": 0, "loss_rank_avg": 0.19475191831588745, "step": 1485, "valid_targets_mean": 4231.1, "valid_targets_min": 1310 }, { "epoch": 2.450905101481075, "grad_norm": 0.2922531287196005, "learning_rate": 2.4171710641236045e-05, "loss": 0.5288, "loss_nan_ranks": 0, "loss_rank_avg": 0.16344180703163147, "step": 1490, "valid_targets_mean": 3704.2, "valid_targets_min": 1093 }, { "epoch": 2.4591332967635764, "grad_norm": 0.29625471879334625, "learning_rate": 2.4059343872802084e-05, "loss": 0.5464, "loss_nan_ranks": 0, "loss_rank_avg": 0.17003777623176575, "step": 1495, "valid_targets_mean": 3797.5, "valid_targets_min": 1323 }, { "epoch": 2.467361492046078, "grad_norm": 0.28096087867759284, "learning_rate": 2.3946843302487497e-05, "loss": 0.5458, "loss_nan_ranks": 0, "loss_rank_avg": 0.17858433723449707, "step": 1500, "valid_targets_mean": 3499.0, "valid_targets_min": 665 }, { "epoch": 2.475589687328579, "grad_norm": 0.261118921385376, "learning_rate": 2.3834212638474773e-05, "loss": 0.5307, "loss_nan_ranks": 0, "loss_rank_avg": 0.18844759464263916, "step": 1505, "valid_targets_mean": 5092.9, "valid_targets_min": 1149 }, { "epoch": 2.483817882611081, "grad_norm": 0.2831486710543651, "learning_rate": 2.372145559323448e-05, "loss": 0.5428, "loss_nan_ranks": 0, "loss_rank_avg": 0.2189253866672516, "step": 1510, "valid_targets_mean": 4786.8, "valid_targets_min": 1492 }, { "epoch": 2.492046077893582, "grad_norm": 0.27484534472121397, "learning_rate": 2.3608575883402903e-05, "loss": 0.5438, "loss_nan_ranks": 0, "loss_rank_avg": 0.18232977390289307, "step": 1515, "valid_targets_mean": 4219.8, "valid_targets_min": 776 }, { "epoch": 2.5002742731760836, "grad_norm": 0.4465063057356539, "learning_rate": 2.3495577229659515e-05, "loss": 0.4163, "loss_nan_ranks": 0, "loss_rank_avg": 0.06493039429187775, "step": 1520, "valid_targets_mean": 5702.6, "valid_targets_min": 2936 }, { "epoch": 2.508502468458585, "grad_norm": 0.340790384582099, "learning_rate": 2.3382463356604378e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.05560822784900665, "step": 1525, "valid_targets_mean": 5383.9, "valid_targets_min": 3193 }, { "epoch": 2.516730663741086, "grad_norm": 0.23433249286165134, "learning_rate": 2.3269237992635318e-05, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.05000593140721321, "step": 1530, "valid_targets_mean": 5404.5, "valid_targets_min": 3254 }, { "epoch": 2.5249588590235876, "grad_norm": 0.21914046561271092, "learning_rate": 2.31559048698251e-05, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.051547035574913025, "step": 1535, "valid_targets_mean": 5669.6, "valid_targets_min": 2339 }, { "epoch": 2.533187054306089, "grad_norm": 0.2022698368996799, "learning_rate": 2.3042467723798335e-05, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.05184007063508034, "step": 1540, "valid_targets_mean": 5712.7, "valid_targets_min": 2963 }, { "epoch": 2.5414152495885904, "grad_norm": 0.1880847339367831, "learning_rate": 2.2928930293608435e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.0460038036108017, "step": 1545, "valid_targets_mean": 5044.9, "valid_targets_min": 2759 }, { "epoch": 2.5496434448710916, "grad_norm": 0.18085215046098602, "learning_rate": 2.281529632161429e-05, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.0443473756313324, "step": 1550, "valid_targets_mean": 5219.8, "valid_targets_min": 2654 }, { "epoch": 2.557871640153593, "grad_norm": 0.19614621783834488, "learning_rate": 2.2701569553356963e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.047740936279296875, "step": 1555, "valid_targets_mean": 5413.7, "valid_targets_min": 3427 }, { "epoch": 2.5660998354360944, "grad_norm": 0.18143070301123154, "learning_rate": 2.2587753737436217e-05, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.04606207087635994, "step": 1560, "valid_targets_mean": 5462.3, "valid_targets_min": 3458 }, { "epoch": 2.5743280307185956, "grad_norm": 0.21959475347948587, "learning_rate": 2.247385262538696e-05, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.05131494253873825, "step": 1565, "valid_targets_mean": 5651.2, "valid_targets_min": 2078 }, { "epoch": 2.5825562260010972, "grad_norm": 0.18550933231717945, "learning_rate": 2.235986997155556e-05, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.04456018656492233, "step": 1570, "valid_targets_mean": 5431.2, "valid_targets_min": 1278 }, { "epoch": 2.5907844212835984, "grad_norm": 0.25278930145039497, "learning_rate": 2.2245809532976157e-05, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.04588646814227104, "step": 1575, "valid_targets_mean": 5013.1, "valid_targets_min": 2521 }, { "epoch": 2.5990126165660996, "grad_norm": 0.21124774470898763, "learning_rate": 2.2131675069246758e-05, "loss": 0.1418, "loss_nan_ranks": 0, "loss_rank_avg": 0.042148131877183914, "step": 1580, "valid_targets_mean": 5014.3, "valid_targets_min": 2703 }, { "epoch": 2.6072408118486012, "grad_norm": 0.20744467482599036, "learning_rate": 2.201747034240537e-05, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.044687531888484955, "step": 1585, "valid_targets_mean": 5006.2, "valid_targets_min": 2670 }, { "epoch": 2.6154690071311024, "grad_norm": 0.18358585696946206, "learning_rate": 2.1903199116805953e-05, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.05012306571006775, "step": 1590, "valid_targets_mean": 6038.5, "valid_targets_min": 3631 }, { "epoch": 2.623697202413604, "grad_norm": 0.2389717332734137, "learning_rate": 2.1788865158994384e-05, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.05136081576347351, "step": 1595, "valid_targets_mean": 4937.4, "valid_targets_min": 2598 }, { "epoch": 2.6319253976961052, "grad_norm": 0.1946054551208735, "learning_rate": 2.1674472237584272e-05, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.046021468937397, "step": 1600, "valid_targets_mean": 5467.6, "valid_targets_min": 2990 }, { "epoch": 2.640153592978607, "grad_norm": 0.2157540275683584, "learning_rate": 2.1560024123132755e-05, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.04845328629016876, "step": 1605, "valid_targets_mean": 5111.8, "valid_targets_min": 2044 }, { "epoch": 2.648381788261108, "grad_norm": 0.20199076365851348, "learning_rate": 2.1445524588016214e-05, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.0499688945710659, "step": 1610, "valid_targets_mean": 5763.9, "valid_targets_min": 2904 }, { "epoch": 2.6566099835436097, "grad_norm": 0.19383269744904036, "learning_rate": 2.1330977406305933e-05, "loss": 0.1419, "loss_nan_ranks": 0, "loss_rank_avg": 0.044633202254772186, "step": 1615, "valid_targets_mean": 4922.0, "valid_targets_min": 2500 }, { "epoch": 2.664838178826111, "grad_norm": 0.20125926925518162, "learning_rate": 2.1216386353643686e-05, "loss": 0.1418, "loss_nan_ranks": 0, "loss_rank_avg": 0.04471147805452347, "step": 1620, "valid_targets_mean": 5118.9, "valid_targets_min": 2923 }, { "epoch": 2.673066374108612, "grad_norm": 0.3738083632546402, "learning_rate": 2.110175520711731e-05, "loss": 0.3568, "loss_nan_ranks": 0, "loss_rank_avg": 0.14241358637809753, "step": 1625, "valid_targets_mean": 3042.4, "valid_targets_min": 1100 }, { "epoch": 2.6812945693911137, "grad_norm": 0.3399624573266519, "learning_rate": 2.098708774513619e-05, "loss": 0.4743, "loss_nan_ranks": 0, "loss_rank_avg": 0.18090471625328064, "step": 1630, "valid_targets_mean": 4385.5, "valid_targets_min": 891 }, { "epoch": 2.689522764673615, "grad_norm": 0.38175053443981743, "learning_rate": 2.0872387747306725e-05, "loss": 0.4392, "loss_nan_ranks": 0, "loss_rank_avg": 0.1515863686800003, "step": 1635, "valid_targets_mean": 1813.8, "valid_targets_min": 507 }, { "epoch": 2.6977509599561165, "grad_norm": 0.2944089441499447, "learning_rate": 2.075765899430773e-05, "loss": 0.4485, "loss_nan_ranks": 0, "loss_rank_avg": 0.13034245371818542, "step": 1640, "valid_targets_mean": 3846.0, "valid_targets_min": 1237 }, { "epoch": 2.7059791552386177, "grad_norm": 0.26016259566125427, "learning_rate": 2.0642905267765846e-05, "loss": 0.4374, "loss_nan_ranks": 0, "loss_rank_avg": 0.1433674395084381, "step": 1645, "valid_targets_mean": 4735.8, "valid_targets_min": 910 }, { "epoch": 2.714207350521119, "grad_norm": 0.29076860147451133, "learning_rate": 2.0528130350130867e-05, "loss": 0.4346, "loss_nan_ranks": 0, "loss_rank_avg": 0.1388690173625946, "step": 1650, "valid_targets_mean": 3882.9, "valid_targets_min": 1176 }, { "epoch": 2.7224355458036205, "grad_norm": 0.27279308035940975, "learning_rate": 2.041333802455109e-05, "loss": 0.4311, "loss_nan_ranks": 0, "loss_rank_avg": 0.1723819077014923, "step": 1655, "valid_targets_mean": 4241.8, "valid_targets_min": 1013 }, { "epoch": 2.7306637410861216, "grad_norm": 0.22293614986974064, "learning_rate": 2.0298532074748594e-05, "loss": 0.4087, "loss_nan_ranks": 0, "loss_rank_avg": 0.11925294995307922, "step": 1660, "valid_targets_mean": 4934.8, "valid_targets_min": 1378 }, { "epoch": 2.7388919363686233, "grad_norm": 0.2864792947502029, "learning_rate": 2.0183716284894533e-05, "loss": 0.451, "loss_nan_ranks": 0, "loss_rank_avg": 0.1562422215938568, "step": 1665, "valid_targets_mean": 3635.7, "valid_targets_min": 1162 }, { "epoch": 2.7471201316511245, "grad_norm": 0.28246275393534515, "learning_rate": 2.00688944394844e-05, "loss": 0.4236, "loss_nan_ranks": 0, "loss_rank_avg": 0.12074942141771317, "step": 1670, "valid_targets_mean": 3513.8, "valid_targets_min": 1441 }, { "epoch": 2.7553483269336256, "grad_norm": 0.6175672954446245, "learning_rate": 1.9954070323213296e-05, "loss": 0.4337, "loss_nan_ranks": 0, "loss_rank_avg": 0.2847403883934021, "step": 1675, "valid_targets_mean": 4413.0, "valid_targets_min": 1233 }, { "epoch": 2.7635765222161273, "grad_norm": 0.23873518139179745, "learning_rate": 1.9839247720851178e-05, "loss": 0.4245, "loss_nan_ranks": 0, "loss_rank_avg": 0.10815485566854477, "step": 1680, "valid_targets_mean": 3737.7, "valid_targets_min": 1650 }, { "epoch": 2.771804717498629, "grad_norm": 0.27032318641137143, "learning_rate": 1.9724430417118074e-05, "loss": 0.4213, "loss_nan_ranks": 0, "loss_rank_avg": 0.11345283687114716, "step": 1685, "valid_targets_mean": 3766.6, "valid_targets_min": 1250 }, { "epoch": 2.78003291278113, "grad_norm": 0.2881813172917136, "learning_rate": 1.9609622196559402e-05, "loss": 0.4447, "loss_nan_ranks": 0, "loss_rank_avg": 0.13241040706634521, "step": 1690, "valid_targets_mean": 3043.5, "valid_targets_min": 1208 }, { "epoch": 2.7882611080636313, "grad_norm": 0.25597327371881795, "learning_rate": 1.9494826843421147e-05, "loss": 0.4473, "loss_nan_ranks": 0, "loss_rank_avg": 0.15462671220302582, "step": 1695, "valid_targets_mean": 4615.1, "valid_targets_min": 269 }, { "epoch": 2.796489303346133, "grad_norm": 0.2656100599955537, "learning_rate": 1.9380048141525194e-05, "loss": 0.4193, "loss_nan_ranks": 0, "loss_rank_avg": 0.13796931505203247, "step": 1700, "valid_targets_mean": 5172.2, "valid_targets_min": 1589 }, { "epoch": 2.804717498628634, "grad_norm": 0.28598719744173756, "learning_rate": 1.9265289874144554e-05, "loss": 0.446, "loss_nan_ranks": 0, "loss_rank_avg": 0.1630500853061676, "step": 1705, "valid_targets_mean": 4159.3, "valid_targets_min": 1283 }, { "epoch": 2.8129456939111357, "grad_norm": 0.27527634681188917, "learning_rate": 1.9150555823878708e-05, "loss": 0.4301, "loss_nan_ranks": 0, "loss_rank_avg": 0.155914306640625, "step": 1710, "valid_targets_mean": 4058.6, "valid_targets_min": 876 }, { "epoch": 2.821173889193637, "grad_norm": 0.2853993592486656, "learning_rate": 1.9035849772528907e-05, "loss": 0.4168, "loss_nan_ranks": 0, "loss_rank_avg": 0.1859429031610489, "step": 1715, "valid_targets_mean": 4401.0, "valid_targets_min": 1349 }, { "epoch": 2.829402084476138, "grad_norm": 0.2519814408323229, "learning_rate": 1.8921175500973496e-05, "loss": 0.4388, "loss_nan_ranks": 0, "loss_rank_avg": 0.12586364150047302, "step": 1720, "valid_targets_mean": 3505.7, "valid_targets_min": 809 }, { "epoch": 2.8376302797586397, "grad_norm": 0.25743712856714657, "learning_rate": 1.8806536789043322e-05, "loss": 0.4373, "loss_nan_ranks": 0, "loss_rank_avg": 0.11665894091129303, "step": 1725, "valid_targets_mean": 3860.3, "valid_targets_min": 602 }, { "epoch": 2.845858475041141, "grad_norm": 0.3117452905892116, "learning_rate": 1.869193741539714e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.11202247440814972, "step": 1730, "valid_targets_mean": 8001.6, "valid_targets_min": 1252 }, { "epoch": 2.8540866703236425, "grad_norm": 0.21933985341011952, "learning_rate": 1.8577381157397056e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.08016058057546616, "step": 1735, "valid_targets_mean": 6021.0, "valid_targets_min": 389 }, { "epoch": 2.8623148656061437, "grad_norm": 0.22902224638423593, "learning_rate": 1.8462871790984015e-05, "loss": 0.2631, "loss_nan_ranks": 0, "loss_rank_avg": 0.12745118141174316, "step": 1740, "valid_targets_mean": 6741.6, "valid_targets_min": 473 }, { "epoch": 2.870543060888645, "grad_norm": 0.21401347256438896, "learning_rate": 1.8348413090553356e-05, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.07021795213222504, "step": 1745, "valid_targets_mean": 5457.3, "valid_targets_min": 253 }, { "epoch": 2.8787712561711465, "grad_norm": 0.19462902063881504, "learning_rate": 1.8234008828830386e-05, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.08573737740516663, "step": 1750, "valid_targets_mean": 6283.3, "valid_targets_min": 146 }, { "epoch": 2.8869994514536477, "grad_norm": 0.202942917615318, "learning_rate": 1.8119662776746043e-05, "loss": 0.2703, "loss_nan_ranks": 0, "loss_rank_avg": 0.08039772510528564, "step": 1755, "valid_targets_mean": 6143.3, "valid_targets_min": 233 }, { "epoch": 2.8952276467361493, "grad_norm": 0.17992757298307224, "learning_rate": 1.800537870331257e-05, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.06841991096735, "step": 1760, "valid_targets_mean": 6087.1, "valid_targets_min": 1118 }, { "epoch": 2.9034558420186505, "grad_norm": 0.17660821788526068, "learning_rate": 1.789116037549933e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.08433274179697037, "step": 1765, "valid_targets_mean": 6520.0, "valid_targets_min": 178 }, { "epoch": 2.911684037301152, "grad_norm": 0.188845019321141, "learning_rate": 1.77770115581086e-05, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.08890101313591003, "step": 1770, "valid_targets_mean": 6715.5, "valid_targets_min": 744 }, { "epoch": 2.9199122325836533, "grad_norm": 0.2250077260143483, "learning_rate": 1.7662936013651493e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.053828299045562744, "step": 1775, "valid_targets_mean": 1099.6, "valid_targets_min": 316 }, { "epoch": 2.928140427866155, "grad_norm": 0.18320311040212517, "learning_rate": 1.7548937502223932e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.061102431267499924, "step": 1780, "valid_targets_mean": 5019.2, "valid_targets_min": 247 }, { "epoch": 2.936368623148656, "grad_norm": 0.17206280683714112, "learning_rate": 1.7435019781382737e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.09793031215667725, "step": 1785, "valid_targets_mean": 7409.7, "valid_targets_min": 1034 }, { "epoch": 2.9445968184311573, "grad_norm": 0.19580444227484753, "learning_rate": 1.732118660602175e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.054457198828458786, "step": 1790, "valid_targets_mean": 4764.1, "valid_targets_min": 243 }, { "epoch": 2.952825013713659, "grad_norm": 0.19600050749352133, "learning_rate": 1.7207441728248055e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.08765925467014313, "step": 1795, "valid_targets_mean": 6958.2, "valid_targets_min": 1080 }, { "epoch": 2.96105320899616, "grad_norm": 0.20856937565072015, "learning_rate": 1.7093788897258338e-05, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.13853465020656586, "step": 1800, "valid_targets_mean": 7221.4, "valid_targets_min": 405 }, { "epoch": 2.9692814042786617, "grad_norm": 0.1961668365424937, "learning_rate": 1.698023185921526e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.10164403915405273, "step": 1805, "valid_targets_mean": 7585.1, "valid_targets_min": 1495 }, { "epoch": 2.977509599561163, "grad_norm": 0.19497785486683333, "learning_rate": 1.6866774357124054e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.1096169725060463, "step": 1810, "valid_targets_mean": 6407.4, "valid_targets_min": 201 }, { "epoch": 2.985737794843664, "grad_norm": 0.17898913986619544, "learning_rate": 1.675342013070905e-05, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.06940888613462448, "step": 1815, "valid_targets_mean": 6268.8, "valid_targets_min": 536 }, { "epoch": 2.9939659901261657, "grad_norm": 0.18783301380836664, "learning_rate": 1.6640172916290515e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.11000367999076843, "step": 1820, "valid_targets_mean": 6778.3, "valid_targets_min": 674 }, { "epoch": 3.0016456390565, "grad_norm": 2.617429539265205, "learning_rate": 1.6527036446661396e-05, "loss": 0.4103, "loss_nan_ranks": 0, "loss_rank_avg": 0.22323724627494812, "step": 1825, "valid_targets_mean": 7264.4, "valid_targets_min": 1973 }, { "epoch": 3.0098738343390017, "grad_norm": 0.8824033570259873, "learning_rate": 1.641401445096436e-05, "loss": 0.5455, "loss_nan_ranks": 0, "loss_rank_avg": 0.1985154151916504, "step": 1830, "valid_targets_mean": 9100.2, "valid_targets_min": 3178 }, { "epoch": 3.018102029621503, "grad_norm": 0.7118784346337131, "learning_rate": 1.6301110654568833e-05, "loss": 0.4481, "loss_nan_ranks": 0, "loss_rank_avg": 0.13510319590568542, "step": 1835, "valid_targets_mean": 6959.6, "valid_targets_min": 2166 }, { "epoch": 3.0263302249040045, "grad_norm": 0.48035427814678705, "learning_rate": 1.6188328778948238e-05, "loss": 0.4066, "loss_nan_ranks": 0, "loss_rank_avg": 0.1353878676891327, "step": 1840, "valid_targets_mean": 7188.0, "valid_targets_min": 2166 }, { "epoch": 3.0345584201865057, "grad_norm": 0.3563748368494854, "learning_rate": 1.6075672541557287e-05, "loss": 0.3745, "loss_nan_ranks": 0, "loss_rank_avg": 0.13746076822280884, "step": 1845, "valid_targets_mean": 6959.9, "valid_targets_min": 2083 }, { "epoch": 3.0427866154690073, "grad_norm": 0.2528267340757668, "learning_rate": 1.5963145655709495e-05, "loss": 0.366, "loss_nan_ranks": 0, "loss_rank_avg": 0.13522320985794067, "step": 1850, "valid_targets_mean": 7818.4, "valid_targets_min": 2042 }, { "epoch": 3.0510148107515085, "grad_norm": 0.235073091120978, "learning_rate": 1.5850751830454747e-05, "loss": 0.3588, "loss_nan_ranks": 0, "loss_rank_avg": 0.12187724560499191, "step": 1855, "valid_targets_mean": 7926.4, "valid_targets_min": 3527 }, { "epoch": 3.0592430060340097, "grad_norm": 0.22130659813335654, "learning_rate": 1.573849477045706e-05, "loss": 0.3523, "loss_nan_ranks": 0, "loss_rank_avg": 0.10538642853498459, "step": 1860, "valid_targets_mean": 6605.4, "valid_targets_min": 2848 }, { "epoch": 3.0674712013165113, "grad_norm": 0.22662966396011508, "learning_rate": 1.5626378175872486e-05, "loss": 0.3435, "loss_nan_ranks": 0, "loss_rank_avg": 0.11400727927684784, "step": 1865, "valid_targets_mean": 6947.1, "valid_targets_min": 2244 }, { "epoch": 3.0756993965990125, "grad_norm": 0.23238049650837628, "learning_rate": 1.5514405742227103e-05, "loss": 0.3478, "loss_nan_ranks": 0, "loss_rank_avg": 0.11836406588554382, "step": 1870, "valid_targets_mean": 7027.9, "valid_targets_min": 340 }, { "epoch": 3.083927591881514, "grad_norm": 0.20760299511274713, "learning_rate": 1.5402581160295265e-05, "loss": 0.3424, "loss_nan_ranks": 0, "loss_rank_avg": 0.13461612164974213, "step": 1875, "valid_targets_mean": 8959.9, "valid_targets_min": 3446 }, { "epoch": 3.0921557871640153, "grad_norm": 0.20502093564997662, "learning_rate": 1.5290908115977884e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.10294201970100403, "step": 1880, "valid_targets_mean": 9482.4, "valid_targets_min": 5095 }, { "epoch": 3.100383982446517, "grad_norm": 0.19747411277171628, "learning_rate": 1.5179390290181013e-05, "loss": 0.3113, "loss_nan_ranks": 0, "loss_rank_avg": 0.09898518025875092, "step": 1885, "valid_targets_mean": 8913.7, "valid_targets_min": 251 }, { "epoch": 3.108612177729018, "grad_norm": 0.19042094134064866, "learning_rate": 1.5068031358694437e-05, "loss": 0.3056, "loss_nan_ranks": 0, "loss_rank_avg": 0.10452181100845337, "step": 1890, "valid_targets_mean": 8780.3, "valid_targets_min": 349 }, { "epoch": 3.1168403730115193, "grad_norm": 0.18674667249593555, "learning_rate": 1.4956834992070589e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.10294011235237122, "step": 1895, "valid_targets_mean": 9303.8, "valid_targets_min": 773 }, { "epoch": 3.125068568294021, "grad_norm": 0.18439896531534866, "learning_rate": 1.4845804855503494e-05, "loss": 0.3039, "loss_nan_ranks": 0, "loss_rank_avg": 0.1009887233376503, "step": 1900, "valid_targets_mean": 9819.0, "valid_targets_min": 5584 }, { "epoch": 3.133296763576522, "grad_norm": 0.18693371137153128, "learning_rate": 1.4734944608708022e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.10432776808738708, "step": 1905, "valid_targets_mean": 9100.7, "valid_targets_min": 306 }, { "epoch": 3.1415249588590237, "grad_norm": 0.1968021432855259, "learning_rate": 1.46242579057992e-05, "loss": 0.3124, "loss_nan_ranks": 0, "loss_rank_avg": 0.10337679833173752, "step": 1910, "valid_targets_mean": 9212.3, "valid_targets_min": 378 }, { "epoch": 3.149753154141525, "grad_norm": 0.19727420663031295, "learning_rate": 1.451374839517183e-05, "loss": 0.3035, "loss_nan_ranks": 0, "loss_rank_avg": 0.09127824008464813, "step": 1915, "valid_targets_mean": 8648.9, "valid_targets_min": 1557 }, { "epoch": 3.1579813494240265, "grad_norm": 0.2133142568969134, "learning_rate": 1.4403419719380161e-05, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.11271902918815613, "step": 1920, "valid_targets_mean": 10183.4, "valid_targets_min": 3886 }, { "epoch": 3.1662095447065277, "grad_norm": 0.19051586500080203, "learning_rate": 1.42932755150179e-05, "loss": 0.3011, "loss_nan_ranks": 0, "loss_rank_avg": 0.09688104689121246, "step": 1925, "valid_targets_mean": 9594.6, "valid_targets_min": 344 }, { "epoch": 3.174437739989029, "grad_norm": 0.1872830976899931, "learning_rate": 1.4183319412598274e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.09433311969041824, "step": 1930, "valid_targets_mean": 8928.9, "valid_targets_min": 897 }, { "epoch": 3.1826659352715305, "grad_norm": 0.1999039787769261, "learning_rate": 1.4073555036434423e-05, "loss": 0.3028, "loss_nan_ranks": 0, "loss_rank_avg": 0.10328617691993713, "step": 1935, "valid_targets_mean": 9772.7, "valid_targets_min": 3574 }, { "epoch": 3.1908941305540317, "grad_norm": 0.19542875185819147, "learning_rate": 1.3963986004519885e-05, "loss": 0.3015, "loss_nan_ranks": 0, "loss_rank_avg": 0.10275737941265106, "step": 1940, "valid_targets_mean": 10406.6, "valid_targets_min": 5877 }, { "epoch": 3.1991223258365333, "grad_norm": 0.1732017772846815, "learning_rate": 1.385461592840939e-05, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.1027611643075943, "step": 1945, "valid_targets_mean": 9535.4, "valid_targets_min": 3557 }, { "epoch": 3.2073505211190345, "grad_norm": 0.1882390427186111, "learning_rate": 1.3745448413099795e-05, "loss": 0.3113, "loss_nan_ranks": 0, "loss_rank_avg": 0.09596308320760727, "step": 1950, "valid_targets_mean": 9136.9, "valid_targets_min": 1343 }, { "epoch": 3.215578716401536, "grad_norm": 0.1810142486999098, "learning_rate": 1.3636487056911236e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.08757059276103973, "step": 1955, "valid_targets_mean": 9388.7, "valid_targets_min": 3282 }, { "epoch": 3.2238069116840373, "grad_norm": 0.18209264751554483, "learning_rate": 1.3527735451368567e-05, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.0974527895450592, "step": 1960, "valid_targets_mean": 9729.2, "valid_targets_min": 3231 }, { "epoch": 3.2320351069665385, "grad_norm": 0.18591292208455748, "learning_rate": 1.3419197181082937e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.11141443252563477, "step": 1965, "valid_targets_mean": 10332.3, "valid_targets_min": 4344 }, { "epoch": 3.24026330224904, "grad_norm": 0.18085390289564288, "learning_rate": 1.3310875823633675e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.10907731205224991, "step": 1970, "valid_targets_mean": 11408.0, "valid_targets_min": 5726 }, { "epoch": 3.2484914975315413, "grad_norm": 0.1893653762416235, "learning_rate": 1.3202774949450326e-05, "loss": 0.3018, "loss_nan_ranks": 0, "loss_rank_avg": 0.10792022943496704, "step": 1975, "valid_targets_mean": 10250.5, "valid_targets_min": 2607 }, { "epoch": 3.256719692814043, "grad_norm": 0.2029953340139833, "learning_rate": 1.3094898121695008e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.09804176539182663, "step": 1980, "valid_targets_mean": 9131.8, "valid_targets_min": 761 }, { "epoch": 3.264947888096544, "grad_norm": 0.1990065296907557, "learning_rate": 1.2987248896144915e-05, "loss": 0.299, "loss_nan_ranks": 0, "loss_rank_avg": 0.10255561023950577, "step": 1985, "valid_targets_mean": 10329.2, "valid_targets_min": 5291 }, { "epoch": 3.2731760833790453, "grad_norm": 0.19438225738776518, "learning_rate": 1.2879830821075174e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.09681476652622223, "step": 1990, "valid_targets_mean": 8999.2, "valid_targets_min": 2381 }, { "epoch": 3.281404278661547, "grad_norm": 0.18865449062923906, "learning_rate": 1.277264743714182e-05, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.10528258979320526, "step": 1995, "valid_targets_mean": 9227.1, "valid_targets_min": 437 }, { "epoch": 3.289632473944048, "grad_norm": 0.20620698231027396, "learning_rate": 1.2665702277265168e-05, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.09422826766967773, "step": 2000, "valid_targets_mean": 9084.0, "valid_targets_min": 1451 }, { "epoch": 3.2978606692265497, "grad_norm": 0.18470245913703312, "learning_rate": 1.2558998866513283e-05, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.08594414591789246, "step": 2005, "valid_targets_mean": 9274.7, "valid_targets_min": 4259 }, { "epoch": 3.306088864509051, "grad_norm": 0.18549116063553767, "learning_rate": 1.245254072198585e-05, "loss": 0.2922, "loss_nan_ranks": 0, "loss_rank_avg": 0.09195162355899811, "step": 2010, "valid_targets_mean": 8931.9, "valid_targets_min": 410 }, { "epoch": 3.3143170597915526, "grad_norm": 0.1963520402334605, "learning_rate": 1.2346331352698206e-05, "loss": 0.3002, "loss_nan_ranks": 0, "loss_rank_avg": 0.12253104895353317, "step": 2015, "valid_targets_mean": 11522.8, "valid_targets_min": 620 }, { "epoch": 3.3225452550740537, "grad_norm": 0.2583659342136034, "learning_rate": 1.224037425946571e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.10416905581951141, "step": 2020, "valid_targets_mean": 6154.2, "valid_targets_min": 386 }, { "epoch": 3.3307734503565554, "grad_norm": 0.24178543153686508, "learning_rate": 1.2134672934788338e-05, "loss": 0.3072, "loss_nan_ranks": 0, "loss_rank_avg": 0.1027805358171463, "step": 2025, "valid_targets_mean": 6070.9, "valid_targets_min": 2967 }, { "epoch": 3.3390016456390565, "grad_norm": 1.895090237361272, "learning_rate": 1.202923086273554e-05, "loss": 0.5715, "loss_nan_ranks": 0, "loss_rank_avg": 0.20451006293296814, "step": 2030, "valid_targets_mean": 3383.0, "valid_targets_min": 1270 }, { "epoch": 3.3472298409215577, "grad_norm": 0.7358808746545971, "learning_rate": 1.1924051518831444e-05, "loss": 0.6695, "loss_nan_ranks": 0, "loss_rank_avg": 0.16195747256278992, "step": 2035, "valid_targets_mean": 2937.2, "valid_targets_min": 1026 }, { "epoch": 3.3554580362040594, "grad_norm": 0.6745202805527456, "learning_rate": 1.1819138369940251e-05, "loss": 0.5868, "loss_nan_ranks": 0, "loss_rank_avg": 0.2747642397880554, "step": 2040, "valid_targets_mean": 4071.6, "valid_targets_min": 1539 }, { "epoch": 3.3636862314865605, "grad_norm": 0.3884525181714535, "learning_rate": 1.1714494874152025e-05, "loss": 0.5628, "loss_nan_ranks": 0, "loss_rank_avg": 0.18681445717811584, "step": 2045, "valid_targets_mean": 5239.0, "valid_targets_min": 1739 }, { "epoch": 3.371914426769062, "grad_norm": 0.3025604115847852, "learning_rate": 1.1610124480668636e-05, "loss": 0.5438, "loss_nan_ranks": 0, "loss_rank_avg": 0.1633882224559784, "step": 2050, "valid_targets_mean": 4039.2, "valid_targets_min": 1204 }, { "epoch": 3.3801426220515634, "grad_norm": 0.29935962744985817, "learning_rate": 1.1506030629690124e-05, "loss": 0.513, "loss_nan_ranks": 0, "loss_rank_avg": 0.1476593315601349, "step": 2055, "valid_targets_mean": 3473.9, "valid_targets_min": 1130 }, { "epoch": 3.3883708173340645, "grad_norm": 0.2901294118474583, "learning_rate": 1.140221675230127e-05, "loss": 0.5226, "loss_nan_ranks": 0, "loss_rank_avg": 0.155238538980484, "step": 2060, "valid_targets_mean": 3420.7, "valid_targets_min": 891 }, { "epoch": 3.396599012616566, "grad_norm": 0.31111984150155464, "learning_rate": 1.1298686270358542e-05, "loss": 0.5053, "loss_nan_ranks": 0, "loss_rank_avg": 0.22876670956611633, "step": 2065, "valid_targets_mean": 3772.6, "valid_targets_min": 1497 }, { "epoch": 3.4048272078990673, "grad_norm": 0.25109657866341767, "learning_rate": 1.1195442596377253e-05, "loss": 0.4982, "loss_nan_ranks": 0, "loss_rank_avg": 0.15915924310684204, "step": 2070, "valid_targets_mean": 4168.5, "valid_targets_min": 972 }, { "epoch": 3.413055403181569, "grad_norm": 0.2583604576475023, "learning_rate": 1.1092489133419137e-05, "loss": 0.4989, "loss_nan_ranks": 0, "loss_rank_avg": 0.11599528789520264, "step": 2075, "valid_targets_mean": 3252.4, "valid_targets_min": 636 }, { "epoch": 3.42128359846407, "grad_norm": 0.27203191468375026, "learning_rate": 1.0989829274980126e-05, "loss": 0.4889, "loss_nan_ranks": 0, "loss_rank_avg": 0.19358757138252258, "step": 2080, "valid_targets_mean": 4318.8, "valid_targets_min": 1103 }, { "epoch": 3.429511793746572, "grad_norm": 0.29509970677561226, "learning_rate": 1.088746640487854e-05, "loss": 0.505, "loss_nan_ranks": 0, "loss_rank_avg": 0.1461564600467682, "step": 2085, "valid_targets_mean": 3735.0, "valid_targets_min": 1048 }, { "epoch": 3.437739989029073, "grad_norm": 0.30173358477297363, "learning_rate": 1.078540389714351e-05, "loss": 0.4832, "loss_nan_ranks": 0, "loss_rank_avg": 0.21707960963249207, "step": 2090, "valid_targets_mean": 4098.8, "valid_targets_min": 1319 }, { "epoch": 3.445968184311574, "grad_norm": 0.24353067059478417, "learning_rate": 1.0683645115903811e-05, "loss": 0.4899, "loss_nan_ranks": 0, "loss_rank_avg": 0.1496349275112152, "step": 2095, "valid_targets_mean": 4343.0, "valid_targets_min": 1454 }, { "epoch": 3.4541963795940758, "grad_norm": 0.2728265370581586, "learning_rate": 1.0582193415276931e-05, "loss": 0.5025, "loss_nan_ranks": 0, "loss_rank_avg": 0.14801722764968872, "step": 2100, "valid_targets_mean": 3758.9, "valid_targets_min": 1151 }, { "epoch": 3.462424574876577, "grad_norm": 0.27268401905899425, "learning_rate": 1.048105213925853e-05, "loss": 0.5072, "loss_nan_ranks": 0, "loss_rank_avg": 0.14311590790748596, "step": 2105, "valid_targets_mean": 3194.6, "valid_targets_min": 994 }, { "epoch": 3.4706527701590786, "grad_norm": 0.27509131095220457, "learning_rate": 1.0380224621612252e-05, "loss": 0.5125, "loss_nan_ranks": 0, "loss_rank_avg": 0.15198372304439545, "step": 2110, "valid_targets_mean": 3790.3, "valid_targets_min": 1391 }, { "epoch": 3.4788809654415798, "grad_norm": 0.2806449483852979, "learning_rate": 1.0279714185759771e-05, "loss": 0.4921, "loss_nan_ranks": 0, "loss_rank_avg": 0.2070062756538391, "step": 2115, "valid_targets_mean": 4685.3, "valid_targets_min": 822 }, { "epoch": 3.4871091607240814, "grad_norm": 0.2501045793083265, "learning_rate": 1.0179524144671315e-05, "loss": 0.4981, "loss_nan_ranks": 0, "loss_rank_avg": 0.13317403197288513, "step": 2120, "valid_targets_mean": 3750.0, "valid_targets_min": 1314 }, { "epoch": 3.4953373560065826, "grad_norm": 0.2653477626320092, "learning_rate": 1.0079657800756409e-05, "loss": 0.5039, "loss_nan_ranks": 0, "loss_rank_avg": 0.15906351804733276, "step": 2125, "valid_targets_mean": 4435.8, "valid_targets_min": 901 }, { "epoch": 3.5035655512890838, "grad_norm": 0.27270201439588876, "learning_rate": 9.980118445755072e-06, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.05085363984107971, "step": 2130, "valid_targets_mean": 5312.0, "valid_targets_min": 2490 }, { "epoch": 3.5117937465715854, "grad_norm": 0.25850926643571376, "learning_rate": 9.880909360629265e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.052780479192733765, "step": 2135, "valid_targets_mean": 5549.4, "valid_targets_min": 3000 }, { "epoch": 3.5200219418540866, "grad_norm": 0.21165170628572016, "learning_rate": 9.782033815454806e-06, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.04313386231660843, "step": 2140, "valid_targets_mean": 5357.1, "valid_targets_min": 2787 }, { "epoch": 3.528250137136588, "grad_norm": 0.181714134126696, "learning_rate": 9.683495069313527e-06, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.05347670614719391, "step": 2145, "valid_targets_mean": 5853.2, "valid_targets_min": 1305 }, { "epoch": 3.5364783324190894, "grad_norm": 0.19681955685226582, "learning_rate": 9.585296370185875e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.04260285198688507, "step": 2150, "valid_targets_mean": 5323.5, "valid_targets_min": 2609 }, { "epoch": 3.5447065277015906, "grad_norm": 0.18774837820824186, "learning_rate": 9.487440954843856e-06, "loss": 0.1299, "loss_nan_ranks": 0, "loss_rank_avg": 0.04370295628905296, "step": 2155, "valid_targets_mean": 5320.9, "valid_targets_min": 3076 }, { "epoch": 3.552934722984092, "grad_norm": 0.17697030654769377, "learning_rate": 9.38993204874436e-06, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.03998667374253273, "step": 2160, "valid_targets_mean": 5294.3, "valid_targets_min": 1502 }, { "epoch": 3.5611629182665934, "grad_norm": 0.17674626038431754, "learning_rate": 9.292772865922792e-06, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.04547334834933281, "step": 2165, "valid_targets_mean": 5738.7, "valid_targets_min": 3508 }, { "epoch": 3.569391113549095, "grad_norm": 0.18303379919738216, "learning_rate": 9.195966608887212e-06, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.040250808000564575, "step": 2170, "valid_targets_mean": 5052.5, "valid_targets_min": 2487 }, { "epoch": 3.577619308831596, "grad_norm": 0.18797337361410427, "learning_rate": 9.099516468512692e-06, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.04151705279946327, "step": 2175, "valid_targets_mean": 5108.5, "valid_targets_min": 3236 }, { "epoch": 3.585847504114098, "grad_norm": 0.17156816751481446, "learning_rate": 9.003425623936208e-06, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.040634635835886, "step": 2180, "valid_targets_mean": 5397.8, "valid_targets_min": 2803 }, { "epoch": 3.594075699396599, "grad_norm": 0.18585953552751092, "learning_rate": 8.907697242451825e-06, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.03988367319107056, "step": 2185, "valid_targets_mean": 5513.7, "valid_targets_min": 2867 }, { "epoch": 3.6023038946791006, "grad_norm": 0.18577716318480716, "learning_rate": 8.812334479406266e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.0442671924829483, "step": 2190, "valid_targets_mean": 5217.7, "valid_targets_min": 2433 }, { "epoch": 3.610532089961602, "grad_norm": 0.19363655736757662, "learning_rate": 8.71734047809498e-06, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.040493179112672806, "step": 2195, "valid_targets_mean": 5169.1, "valid_targets_min": 2789 }, { "epoch": 3.618760285244103, "grad_norm": 0.16716286573436492, "learning_rate": 8.62271836965846e-06, "loss": 0.1258, "loss_nan_ranks": 0, "loss_rank_avg": 0.04132536053657532, "step": 2200, "valid_targets_mean": 5809.1, "valid_targets_min": 2841 }, { "epoch": 3.6269884805266046, "grad_norm": 0.18637501105182114, "learning_rate": 8.528471272979083e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.04350794851779938, "step": 2205, "valid_targets_mean": 5502.1, "valid_targets_min": 2911 }, { "epoch": 3.635216675809106, "grad_norm": 0.19484985192773233, "learning_rate": 8.434602294578285e-06, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.04264716058969498, "step": 2210, "valid_targets_mean": 5274.9, "valid_targets_min": 2672 }, { "epoch": 3.6434448710916074, "grad_norm": 0.18319091175169402, "learning_rate": 8.341114528514192e-06, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.04070258140563965, "step": 2215, "valid_targets_mean": 4966.8, "valid_targets_min": 2931 }, { "epoch": 3.6516730663741086, "grad_norm": 0.18406967880449163, "learning_rate": 8.248011056279588e-06, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.04556259140372276, "step": 2220, "valid_targets_mean": 5898.0, "valid_targets_min": 3337 }, { "epoch": 3.65990126165661, "grad_norm": 0.19470458062154897, "learning_rate": 8.155294946700402e-06, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.043193720281124115, "step": 2225, "valid_targets_mean": 5214.2, "valid_targets_min": 2978 }, { "epoch": 3.6681294569391114, "grad_norm": 0.25333892509494665, "learning_rate": 8.062969255834505e-06, "loss": 0.1339, "loss_nan_ranks": 0, "loss_rank_avg": 0.09117273986339569, "step": 2230, "valid_targets_mean": 3851.8, "valid_targets_min": 887 }, { "epoch": 3.6763576522216126, "grad_norm": 0.3855404264715868, "learning_rate": 7.971037026871016e-06, "loss": 0.4519, "loss_nan_ranks": 0, "loss_rank_avg": 0.1366964727640152, "step": 2235, "valid_targets_mean": 4596.2, "valid_targets_min": 1143 }, { "epoch": 3.684585847504114, "grad_norm": 0.2895125132387707, "learning_rate": 7.879501290029954e-06, "loss": 0.4387, "loss_nan_ranks": 0, "loss_rank_avg": 0.136347234249115, "step": 2240, "valid_targets_mean": 4087.0, "valid_targets_min": 1058 }, { "epoch": 3.6928140427866154, "grad_norm": 0.32375236588358164, "learning_rate": 7.788365062462411e-06, "loss": 0.4199, "loss_nan_ranks": 0, "loss_rank_avg": 0.1273779571056366, "step": 2245, "valid_targets_mean": 3146.8, "valid_targets_min": 960 }, { "epoch": 3.7010422380691166, "grad_norm": 0.2765774016675542, "learning_rate": 7.697631348151048e-06, "loss": 0.419, "loss_nan_ranks": 0, "loss_rank_avg": 0.14948008954524994, "step": 2250, "valid_targets_mean": 4243.4, "valid_targets_min": 890 }, { "epoch": 3.709270433351618, "grad_norm": 0.2405231497548994, "learning_rate": 7.607303137811108e-06, "loss": 0.3877, "loss_nan_ranks": 0, "loss_rank_avg": 0.10435382276773453, "step": 2255, "valid_targets_mean": 4787.6, "valid_targets_min": 989 }, { "epoch": 3.71749862863412, "grad_norm": 0.28959377843811446, "learning_rate": 7.517383408791847e-06, "loss": 0.4175, "loss_nan_ranks": 0, "loss_rank_avg": 0.1839148998260498, "step": 2260, "valid_targets_mean": 4654.7, "valid_targets_min": 385 }, { "epoch": 3.725726823916621, "grad_norm": 0.27304162379886376, "learning_rate": 7.427875124978359e-06, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.13247811794281006, "step": 2265, "valid_targets_mean": 3702.7, "valid_targets_min": 1391 }, { "epoch": 3.733955019199122, "grad_norm": 0.30525674061003377, "learning_rate": 7.33878123669393e-06, "loss": 0.3865, "loss_nan_ranks": 0, "loss_rank_avg": 0.13155576586723328, "step": 2270, "valid_targets_mean": 3575.6, "valid_targets_min": 1115 }, { "epoch": 3.742183214481624, "grad_norm": 0.23940187715657524, "learning_rate": 7.2501046806027456e-06, "loss": 0.41, "loss_nan_ranks": 0, "loss_rank_avg": 0.11278781294822693, "step": 2275, "valid_targets_mean": 3883.8, "valid_targets_min": 1256 }, { "epoch": 3.750411409764125, "grad_norm": 0.26157914151130646, "learning_rate": 7.161848379613134e-06, "loss": 0.394, "loss_nan_ranks": 0, "loss_rank_avg": 0.11556685715913773, "step": 2280, "valid_targets_mean": 4064.0, "valid_targets_min": 1346 }, { "epoch": 3.7586396050466266, "grad_norm": 0.2754096668324058, "learning_rate": 7.074015242781181e-06, "loss": 0.4103, "loss_nan_ranks": 0, "loss_rank_avg": 0.136755108833313, "step": 2285, "valid_targets_mean": 3096.2, "valid_targets_min": 695 }, { "epoch": 3.766867800329128, "grad_norm": 0.2673295797880238, "learning_rate": 6.986608165214892e-06, "loss": 0.3874, "loss_nan_ranks": 0, "loss_rank_avg": 0.13044080138206482, "step": 2290, "valid_targets_mean": 3573.1, "valid_targets_min": 1272 }, { "epoch": 3.775095995611629, "grad_norm": 0.24565165248996393, "learning_rate": 6.899630027978717e-06, "loss": 0.3862, "loss_nan_ranks": 0, "loss_rank_avg": 0.11896165460348129, "step": 2295, "valid_targets_mean": 4696.2, "valid_targets_min": 939 }, { "epoch": 3.7833241908941306, "grad_norm": 0.26076112407188706, "learning_rate": 6.8130836979986236e-06, "loss": 0.4288, "loss_nan_ranks": 0, "loss_rank_avg": 0.1774311065673828, "step": 2300, "valid_targets_mean": 4314.5, "valid_targets_min": 1135 }, { "epoch": 3.791552386176632, "grad_norm": 0.26624764344340895, "learning_rate": 6.7269720279675755e-06, "loss": 0.3908, "loss_nan_ranks": 0, "loss_rank_avg": 0.1311570405960083, "step": 2305, "valid_targets_mean": 3551.0, "valid_targets_min": 909 }, { "epoch": 3.7997805814591334, "grad_norm": 0.27025205393210866, "learning_rate": 6.641297856251514e-06, "loss": 0.4191, "loss_nan_ranks": 0, "loss_rank_avg": 0.134062260389328, "step": 2310, "valid_targets_mean": 3728.1, "valid_targets_min": 970 }, { "epoch": 3.8080087767416346, "grad_norm": 0.24904092712840964, "learning_rate": 6.556064006795795e-06, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.1097637414932251, "step": 2315, "valid_targets_mean": 3462.3, "valid_targets_min": 1420 }, { "epoch": 3.816236972024136, "grad_norm": 0.24275402888828918, "learning_rate": 6.471273289032125e-06, "loss": 0.4029, "loss_nan_ranks": 0, "loss_rank_avg": 0.1297762244939804, "step": 2320, "valid_targets_mean": 4587.7, "valid_targets_min": 1133 }, { "epoch": 3.8244651673066374, "grad_norm": 0.2654856935959466, "learning_rate": 6.386928497785929e-06, "loss": 0.3892, "loss_nan_ranks": 0, "loss_rank_avg": 0.1179320216178894, "step": 2325, "valid_targets_mean": 3638.8, "valid_targets_min": 1166 }, { "epoch": 3.8326933625891386, "grad_norm": 0.2648669254710519, "learning_rate": 6.303032413184256e-06, "loss": 0.4142, "loss_nan_ranks": 0, "loss_rank_avg": 0.13473305106163025, "step": 2330, "valid_targets_mean": 4151.9, "valid_targets_min": 1404 }, { "epoch": 3.8409215578716402, "grad_norm": 0.25274953101806685, "learning_rate": 6.219587800564135e-06, "loss": 0.3908, "loss_nan_ranks": 0, "loss_rank_avg": 0.07814621180295944, "step": 2335, "valid_targets_mean": 1979.0, "valid_targets_min": 506 }, { "epoch": 3.8491497531541414, "grad_norm": 0.2799408422446661, "learning_rate": 6.136597410381404e-06, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.0938805416226387, "step": 2340, "valid_targets_mean": 6913.1, "valid_targets_min": 817 }, { "epoch": 3.857377948436643, "grad_norm": 0.2128799029136465, "learning_rate": 6.054063978120093e-06, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.08730052411556244, "step": 2345, "valid_targets_mean": 6177.3, "valid_targets_min": 509 }, { "epoch": 3.8656061437191442, "grad_norm": 0.20296058207505324, "learning_rate": 5.971990224202209e-06, "loss": 0.2501, "loss_nan_ranks": 0, "loss_rank_avg": 0.08442901074886322, "step": 2350, "valid_targets_mean": 6737.9, "valid_targets_min": 1241 }, { "epoch": 3.873834339001646, "grad_norm": 0.17908986617598158, "learning_rate": 5.890378853898106e-06, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.09330446273088455, "step": 2355, "valid_targets_mean": 7625.8, "valid_targets_min": 597 }, { "epoch": 3.882062534284147, "grad_norm": 0.24834625855840978, "learning_rate": 5.809232557237292e-06, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.1216353327035904, "step": 2360, "valid_targets_mean": 6605.6, "valid_targets_min": 335 }, { "epoch": 3.8902907295666482, "grad_norm": 0.17101902840906216, "learning_rate": 5.728554008919794e-06, "loss": 0.2444, "loss_nan_ranks": 0, "loss_rank_avg": 0.08080480992794037, "step": 2365, "valid_targets_mean": 6378.9, "valid_targets_min": 281 }, { "epoch": 3.89851892484915, "grad_norm": 0.17341671996138142, "learning_rate": 5.6483458682279354e-06, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.06936435401439667, "step": 2370, "valid_targets_mean": 5468.6, "valid_targets_min": 543 }, { "epoch": 3.906747120131651, "grad_norm": 0.16456626810742647, "learning_rate": 5.568610778938761e-06, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.07711958140134811, "step": 2375, "valid_targets_mean": 6290.5, "valid_targets_min": 301 }, { "epoch": 3.9149753154141527, "grad_norm": 0.1695584593994994, "learning_rate": 5.489351369236817e-06, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.05445744842290878, "step": 2380, "valid_targets_mean": 4845.6, "valid_targets_min": 401 }, { "epoch": 3.923203510696654, "grad_norm": 0.1800936264070191, "learning_rate": 5.410570251627587e-06, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.08194078505039215, "step": 2385, "valid_targets_mean": 6736.4, "valid_targets_min": 134 }, { "epoch": 3.931431705979155, "grad_norm": 0.174046744890005, "learning_rate": 5.332270022851327e-06, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.09117108583450317, "step": 2390, "valid_targets_mean": 7333.2, "valid_targets_min": 1427 }, { "epoch": 3.9396599012616567, "grad_norm": 0.2458671161035671, "learning_rate": 5.254453263797521e-06, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.04853862524032593, "step": 2395, "valid_targets_mean": 1272.8, "valid_targets_min": 374 }, { "epoch": 3.947888096544158, "grad_norm": 0.26767848712622627, "learning_rate": 5.177122539419763e-06, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.0782180204987526, "step": 2400, "valid_targets_mean": 6596.2, "valid_targets_min": 491 }, { "epoch": 3.9561162918266595, "grad_norm": 0.16636456794257964, "learning_rate": 5.10028039865126e-06, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.05681359022855759, "step": 2405, "valid_targets_mean": 5984.0, "valid_targets_min": 350 }, { "epoch": 3.9643444871091607, "grad_norm": 0.1766915803923583, "learning_rate": 5.023929374320779e-06, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.08463890850543976, "step": 2410, "valid_targets_mean": 6808.1, "valid_targets_min": 367 }, { "epoch": 3.972572682391662, "grad_norm": 0.18083090564134296, "learning_rate": 4.948071983069167e-06, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.08655136823654175, "step": 2415, "valid_targets_mean": 6776.0, "valid_targets_min": 475 }, { "epoch": 3.9808008776741635, "grad_norm": 0.2150095285524866, "learning_rate": 4.8727107252664315e-06, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.10201592743396759, "step": 2420, "valid_targets_mean": 7100.5, "valid_targets_min": 370 }, { "epoch": 3.989029072956665, "grad_norm": 0.1714470668143074, "learning_rate": 4.797848084929271e-06, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.06286249309778214, "step": 2425, "valid_targets_mean": 5628.6, "valid_targets_min": 503 }, { "epoch": 3.9972572682391663, "grad_norm": 0.16916735134740704, "learning_rate": 4.723486529639252e-06, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.08586841821670532, "step": 2430, "valid_targets_mean": 6859.2, "valid_targets_min": 578 }, { "epoch": 4.004936917169501, "grad_norm": 2.336956202835139, "learning_rate": 4.649628510461428e-06, "loss": 0.514, "loss_nan_ranks": 0, "loss_rank_avg": 0.21151629090309143, "step": 2435, "valid_targets_mean": 7854.0, "valid_targets_min": 2676 }, { "epoch": 4.013165112452002, "grad_norm": 1.41923931878634, "learning_rate": 4.576276461863589e-06, "loss": 0.5277, "loss_nan_ranks": 0, "loss_rank_avg": 0.15032610297203064, "step": 2440, "valid_targets_mean": 6740.2, "valid_targets_min": 3017 }, { "epoch": 4.021393307734503, "grad_norm": 0.8500945954778326, "learning_rate": 4.503432801635976e-06, "loss": 0.46, "loss_nan_ranks": 0, "loss_rank_avg": 0.13372503221035004, "step": 2445, "valid_targets_mean": 7294.2, "valid_targets_min": 3200 }, { "epoch": 4.029621503017005, "grad_norm": 0.6004641788267427, "learning_rate": 4.431099930811633e-06, "loss": 0.4076, "loss_nan_ranks": 0, "loss_rank_avg": 0.14208507537841797, "step": 2450, "valid_targets_mean": 7212.2, "valid_targets_min": 2554 }, { "epoch": 4.037849698299507, "grad_norm": 0.46434648019740743, "learning_rate": 4.359280233587229e-06, "loss": 0.3746, "loss_nan_ranks": 0, "loss_rank_avg": 0.12539725005626678, "step": 2455, "valid_targets_mean": 7016.0, "valid_targets_min": 2429 }, { "epoch": 4.046077893582008, "grad_norm": 0.3135597964334871, "learning_rate": 4.28797607724448e-06, "loss": 0.3607, "loss_nan_ranks": 0, "loss_rank_avg": 0.11195516586303711, "step": 2460, "valid_targets_mean": 7897.7, "valid_targets_min": 2091 }, { "epoch": 4.054306088864509, "grad_norm": 0.26939488289825964, "learning_rate": 4.217189812072131e-06, "loss": 0.3497, "loss_nan_ranks": 0, "loss_rank_avg": 0.12193445861339569, "step": 2465, "valid_targets_mean": 7362.4, "valid_targets_min": 1674 }, { "epoch": 4.06253428414701, "grad_norm": 0.26655830700455374, "learning_rate": 4.146923771288489e-06, "loss": 0.336, "loss_nan_ranks": 0, "loss_rank_avg": 0.11060521006584167, "step": 2470, "valid_targets_mean": 6896.6, "valid_targets_min": 2522 }, { "epoch": 4.070762479429511, "grad_norm": 0.21602585425107565, "learning_rate": 4.077180270964487e-06, "loss": 0.3354, "loss_nan_ranks": 0, "loss_rank_avg": 0.10641120374202728, "step": 2475, "valid_targets_mean": 7470.7, "valid_targets_min": 2790 }, { "epoch": 4.0789906747120135, "grad_norm": 0.19078412445817078, "learning_rate": 4.007961609947391e-06, "loss": 0.3356, "loss_nan_ranks": 0, "loss_rank_avg": 0.11443803459405899, "step": 2480, "valid_targets_mean": 8266.8, "valid_targets_min": 3307 }, { "epoch": 4.087218869994515, "grad_norm": 0.2034314805463107, "learning_rate": 3.93927006978497e-06, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.09000586718320847, "step": 2485, "valid_targets_mean": 8286.0, "valid_targets_min": 325 }, { "epoch": 4.095447065277016, "grad_norm": 0.1845196550420189, "learning_rate": 3.8711079146503474e-06, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.10727182030677795, "step": 2490, "valid_targets_mean": 9267.8, "valid_targets_min": 5215 }, { "epoch": 4.103675260559517, "grad_norm": 0.17034619427285855, "learning_rate": 3.8034773912673383e-06, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.10079951584339142, "step": 2495, "valid_targets_mean": 9206.4, "valid_targets_min": 3552 }, { "epoch": 4.111903455842018, "grad_norm": 0.16544617657311927, "learning_rate": 3.736380728836393e-06, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.1036929041147232, "step": 2500, "valid_targets_mean": 9805.0, "valid_targets_min": 435 }, { "epoch": 4.12013165112452, "grad_norm": 0.1675109415038507, "learning_rate": 3.6698201389611423e-06, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.10505664348602295, "step": 2505, "valid_targets_mean": 9971.8, "valid_targets_min": 3896 }, { "epoch": 4.1283598464070215, "grad_norm": 0.17732216459505157, "learning_rate": 3.6037978155754737e-06, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.09879560768604279, "step": 2510, "valid_targets_mean": 9100.1, "valid_targets_min": 3598 }, { "epoch": 4.136588041689523, "grad_norm": 0.17652461132533978, "learning_rate": 3.53831593487123e-06, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.09788352251052856, "step": 2515, "valid_targets_mean": 9095.8, "valid_targets_min": 3870 }, { "epoch": 4.144816236972024, "grad_norm": 0.1751708078026008, "learning_rate": 3.473376655226479e-06, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.09423353523015976, "step": 2520, "valid_targets_mean": 8719.1, "valid_targets_min": 3803 }, { "epoch": 4.153044432254526, "grad_norm": 0.1617553991074427, "learning_rate": 3.408982117134374e-06, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.10206412523984909, "step": 2525, "valid_targets_mean": 9952.8, "valid_targets_min": 703 }, { "epoch": 4.161272627537027, "grad_norm": 0.17010544092490168, "learning_rate": 3.3451344431325806e-06, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.09758783876895905, "step": 2530, "valid_targets_mean": 9790.2, "valid_targets_min": 1990 }, { "epoch": 4.169500822819528, "grad_norm": 0.1759410398694626, "learning_rate": 3.2818357377333455e-06, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.09575256705284119, "step": 2535, "valid_targets_mean": 9145.0, "valid_targets_min": 3036 }, { "epoch": 4.1777290181020295, "grad_norm": 0.16216951102404267, "learning_rate": 3.219088087354092e-06, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.08874919265508652, "step": 2540, "valid_targets_mean": 9393.3, "valid_targets_min": 749 }, { "epoch": 4.185957213384531, "grad_norm": 0.1633207914795439, "learning_rate": 3.156893560248688e-06, "loss": 0.2885, "loss_nan_ranks": 0, "loss_rank_avg": 0.08750354498624802, "step": 2545, "valid_targets_mean": 8753.6, "valid_targets_min": 721 }, { "epoch": 4.194185408667033, "grad_norm": 0.17268830072169394, "learning_rate": 3.095254206439233e-06, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.09792269021272659, "step": 2550, "valid_targets_mean": 9578.5, "valid_targets_min": 2306 }, { "epoch": 4.202413603949534, "grad_norm": 0.1631186432521016, "learning_rate": 3.0341720576485277e-06, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.09698028117418289, "step": 2555, "valid_targets_mean": 9520.8, "valid_targets_min": 4270 }, { "epoch": 4.210641799232035, "grad_norm": 0.1635172649108156, "learning_rate": 2.9736491272330694e-06, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.10328608751296997, "step": 2560, "valid_targets_mean": 10044.1, "valid_targets_min": 5057 }, { "epoch": 4.218869994514536, "grad_norm": 0.1588271104676105, "learning_rate": 2.9136874101167034e-06, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.09239079058170319, "step": 2565, "valid_targets_mean": 9430.1, "valid_targets_min": 4478 }, { "epoch": 4.227098189797037, "grad_norm": 0.15675985150107885, "learning_rate": 2.854288882724885e-06, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.09478726983070374, "step": 2570, "valid_targets_mean": 9906.8, "valid_targets_min": 4602 }, { "epoch": 4.2353263850795395, "grad_norm": 0.15893873290014987, "learning_rate": 2.795455502919493e-06, "loss": 0.2877, "loss_nan_ranks": 0, "loss_rank_avg": 0.09879006445407867, "step": 2575, "valid_targets_mean": 9816.9, "valid_targets_min": 600 }, { "epoch": 4.243554580362041, "grad_norm": 0.16008381725374082, "learning_rate": 2.7371892099343455e-06, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.09585876762866974, "step": 2580, "valid_targets_mean": 9615.7, "valid_targets_min": 321 }, { "epoch": 4.251782775644542, "grad_norm": 0.16240540291320715, "learning_rate": 2.679491924311226e-06, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.09075018763542175, "step": 2585, "valid_targets_mean": 9669.4, "valid_targets_min": 4373 }, { "epoch": 4.260010970927043, "grad_norm": 0.16123315756596274, "learning_rate": 2.622365547836636e-06, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.10122531652450562, "step": 2590, "valid_targets_mean": 10030.3, "valid_targets_min": 4760 }, { "epoch": 4.268239166209545, "grad_norm": 0.1614050818709832, "learning_rate": 2.5658119634790526e-06, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.09613090753555298, "step": 2595, "valid_targets_mean": 9881.2, "valid_targets_min": 4785 }, { "epoch": 4.276467361492046, "grad_norm": 0.16136146793987857, "learning_rate": 2.5098330353269164e-06, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.09504969418048859, "step": 2600, "valid_targets_mean": 9669.7, "valid_targets_min": 3932 }, { "epoch": 4.2846955567745475, "grad_norm": 0.16203287980747294, "learning_rate": 2.4544306085271406e-06, "loss": 0.2843, "loss_nan_ranks": 0, "loss_rank_avg": 0.09451472014188766, "step": 2605, "valid_targets_mean": 9425.6, "valid_targets_min": 3063 }, { "epoch": 4.292923752057049, "grad_norm": 0.1664226870010622, "learning_rate": 2.399606509224337e-06, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.10325511544942856, "step": 2610, "valid_targets_mean": 9942.2, "valid_targets_min": 3468 }, { "epoch": 4.30115194733955, "grad_norm": 0.16319711424290925, "learning_rate": 2.345362544500589e-06, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.09199801087379456, "step": 2615, "valid_targets_mean": 9693.8, "valid_targets_min": 562 }, { "epoch": 4.309380142622052, "grad_norm": 0.16661531597560844, "learning_rate": 2.2917005023158966e-06, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.10052244365215302, "step": 2620, "valid_targets_mean": 10011.0, "valid_targets_min": 3774 }, { "epoch": 4.317608337904553, "grad_norm": 0.18510374807764027, "learning_rate": 2.2386221514492502e-06, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.06400661915540695, "step": 2625, "valid_targets_mean": 5209.4, "valid_targets_min": 484 }, { "epoch": 4.325836533187054, "grad_norm": 0.22137356711405826, "learning_rate": 2.186129241440336e-06, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.09740819036960602, "step": 2630, "valid_targets_mean": 6386.3, "valid_targets_min": 3796 }, { "epoch": 4.3340647284695555, "grad_norm": 0.23070165597543357, "learning_rate": 2.134223502531838e-06, "loss": 0.2902, "loss_nan_ranks": 0, "loss_rank_avg": 0.10796046257019043, "step": 2635, "valid_targets_mean": 6407.3, "valid_targets_min": 2561 }, { "epoch": 4.342292923752057, "grad_norm": 1.634978861513987, "learning_rate": 2.0829066456124415e-06, "loss": 0.6808, "loss_nan_ranks": 0, "loss_rank_avg": 0.21645402908325195, "step": 2640, "valid_targets_mean": 4497.1, "valid_targets_min": 1348 }, { "epoch": 4.350521119034559, "grad_norm": 1.2882498753330385, "learning_rate": 2.032180362160423e-06, "loss": 0.6324, "loss_nan_ranks": 0, "loss_rank_avg": 0.17659324407577515, "step": 2645, "valid_targets_mean": 4428.4, "valid_targets_min": 1031 }, { "epoch": 4.35874931431706, "grad_norm": 1.043040981513531, "learning_rate": 1.9820463241878873e-06, "loss": 0.62, "loss_nan_ranks": 0, "loss_rank_avg": 0.22026868164539337, "step": 2650, "valid_targets_mean": 3730.1, "valid_targets_min": 827 }, { "epoch": 4.366977509599561, "grad_norm": 0.6949809377584997, "learning_rate": 1.9325061841856808e-06, "loss": 0.5603, "loss_nan_ranks": 0, "loss_rank_avg": 0.21149209141731262, "step": 2655, "valid_targets_mean": 4497.8, "valid_targets_min": 1422 }, { "epoch": 4.375205704882062, "grad_norm": 0.5381576597915756, "learning_rate": 1.8835615750688997e-06, "loss": 0.5239, "loss_nan_ranks": 0, "loss_rank_avg": 0.14553728699684143, "step": 2660, "valid_targets_mean": 2116.2, "valid_targets_min": 785 }, { "epoch": 4.3834339001645635, "grad_norm": 0.3521266371539034, "learning_rate": 1.8352141101230758e-06, "loss": 0.5108, "loss_nan_ranks": 0, "loss_rank_avg": 0.15841825306415558, "step": 2665, "valid_targets_mean": 4756.1, "valid_targets_min": 1301 }, { "epoch": 4.3916620954470655, "grad_norm": 0.2892377482447778, "learning_rate": 1.787465382950999e-06, "loss": 0.4972, "loss_nan_ranks": 0, "loss_rank_avg": 0.15879112482070923, "step": 2670, "valid_targets_mean": 4760.8, "valid_targets_min": 758 }, { "epoch": 4.399890290729567, "grad_norm": 0.31603860554853436, "learning_rate": 1.7403169674202036e-06, "loss": 0.5039, "loss_nan_ranks": 0, "loss_rank_avg": 0.16973236203193665, "step": 2675, "valid_targets_mean": 3936.6, "valid_targets_min": 1412 }, { "epoch": 4.408118486012068, "grad_norm": 0.31041708575716764, "learning_rate": 1.6937704176110582e-06, "loss": 0.4889, "loss_nan_ranks": 0, "loss_rank_avg": 0.175504669547081, "step": 2680, "valid_targets_mean": 4049.9, "valid_targets_min": 928 }, { "epoch": 4.416346681294569, "grad_norm": 0.31096923174048335, "learning_rate": 1.6478272677655804e-06, "loss": 0.4648, "loss_nan_ranks": 0, "loss_rank_avg": 0.1734139621257782, "step": 2685, "valid_targets_mean": 3266.9, "valid_targets_min": 782 }, { "epoch": 4.424574876577071, "grad_norm": 0.24393298018131654, "learning_rate": 1.6024890322368358e-06, "loss": 0.4778, "loss_nan_ranks": 0, "loss_rank_avg": 0.16197149455547333, "step": 2690, "valid_targets_mean": 4822.6, "valid_targets_min": 1093 }, { "epoch": 4.432803071859572, "grad_norm": 0.2514174477374428, "learning_rate": 1.5577572054390388e-06, "loss": 0.4799, "loss_nan_ranks": 0, "loss_rank_avg": 0.14338165521621704, "step": 2695, "valid_targets_mean": 3932.0, "valid_targets_min": 1179 }, { "epoch": 4.4410312671420735, "grad_norm": 0.26955755821506955, "learning_rate": 1.5136332617982863e-06, "loss": 0.4633, "loss_nan_ranks": 0, "loss_rank_avg": 0.16022084653377533, "step": 2700, "valid_targets_mean": 3117.2, "valid_targets_min": 1152 }, { "epoch": 4.449259462424575, "grad_norm": 0.2573136431453555, "learning_rate": 1.4701186557039648e-06, "loss": 0.4941, "loss_nan_ranks": 0, "loss_rank_avg": 0.13580411672592163, "step": 2705, "valid_targets_mean": 3402.1, "valid_targets_min": 1357 }, { "epoch": 4.457487657707076, "grad_norm": 0.38826071621804453, "learning_rate": 1.4272148214608073e-06, "loss": 0.4766, "loss_nan_ranks": 0, "loss_rank_avg": 0.2044774889945984, "step": 2710, "valid_targets_mean": 3427.9, "valid_targets_min": 1115 }, { "epoch": 4.465715852989578, "grad_norm": 0.227099580695401, "learning_rate": 1.384923173241619e-06, "loss": 0.4828, "loss_nan_ranks": 0, "loss_rank_avg": 0.14953580498695374, "step": 2715, "valid_targets_mean": 4640.0, "valid_targets_min": 1563 }, { "epoch": 4.473944048272079, "grad_norm": 0.22830741711269528, "learning_rate": 1.3432451050406603e-06, "loss": 0.4872, "loss_nan_ranks": 0, "loss_rank_avg": 0.15632256865501404, "step": 2720, "valid_targets_mean": 3996.0, "valid_targets_min": 1296 }, { "epoch": 4.48217224355458, "grad_norm": 0.2507077891470695, "learning_rate": 1.3021819906277021e-06, "loss": 0.4717, "loss_nan_ranks": 0, "loss_rank_avg": 0.148903489112854, "step": 2725, "valid_targets_mean": 3636.5, "valid_targets_min": 1273 }, { "epoch": 4.4904004388370815, "grad_norm": 0.2604213246216982, "learning_rate": 1.2617351835027481e-06, "loss": 0.5015, "loss_nan_ranks": 0, "loss_rank_avg": 0.16615310311317444, "step": 2730, "valid_targets_mean": 3391.8, "valid_targets_min": 1536 }, { "epoch": 4.498628634119583, "grad_norm": 0.42603564994275517, "learning_rate": 1.2219060168514086e-06, "loss": 0.4304, "loss_nan_ranks": 0, "loss_rank_avg": 0.09591139853000641, "step": 2735, "valid_targets_mean": 5537.1, "valid_targets_min": 2564 }, { "epoch": 4.506856829402085, "grad_norm": 0.44103615162619425, "learning_rate": 1.1826958035009773e-06, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.054220978170633316, "step": 2740, "valid_targets_mean": 5478.3, "valid_targets_min": 2226 }, { "epoch": 4.515085024684586, "grad_norm": 0.28894591073573966, "learning_rate": 1.1441058358771317e-06, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.04055090993642807, "step": 2745, "valid_targets_mean": 4935.5, "valid_targets_min": 2518 }, { "epoch": 4.523313219967087, "grad_norm": 0.23637425110289348, "learning_rate": 1.1061373859613634e-06, "loss": 0.1359, "loss_nan_ranks": 0, "loss_rank_avg": 0.045938000082969666, "step": 2750, "valid_targets_mean": 5529.9, "valid_targets_min": 3140 }, { "epoch": 4.531541415249588, "grad_norm": 0.21800711396947803, "learning_rate": 1.0687917052490193e-06, "loss": 0.1283, "loss_nan_ranks": 0, "loss_rank_avg": 0.039560433477163315, "step": 2755, "valid_targets_mean": 4935.2, "valid_targets_min": 2984 }, { "epoch": 4.53976961053209, "grad_norm": 0.197365764296847, "learning_rate": 1.032070024708085e-06, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.039238572120666504, "step": 2760, "valid_targets_mean": 4934.8, "valid_targets_min": 2648 }, { "epoch": 4.547997805814592, "grad_norm": 0.18608496032386362, "learning_rate": 9.959735547385762e-07, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.04007216915488243, "step": 2765, "valid_targets_mean": 5136.8, "valid_targets_min": 2159 }, { "epoch": 4.556226001097093, "grad_norm": 0.1728807254072536, "learning_rate": 9.605034851326644e-07, "loss": 0.124, "loss_nan_ranks": 0, "loss_rank_avg": 0.038183607161045074, "step": 2770, "valid_targets_mean": 5029.4, "valid_targets_min": 2963 }, { "epoch": 4.564454196379594, "grad_norm": 0.19435780088328164, "learning_rate": 9.256609850354636e-07, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.04276277869939804, "step": 2775, "valid_targets_mean": 5930.7, "valid_targets_min": 2714 }, { "epoch": 4.572682391662095, "grad_norm": 0.17792201797210133, "learning_rate": 8.91447202906468e-07, "loss": 0.1185, "loss_nan_ranks": 0, "loss_rank_avg": 0.03755832463502884, "step": 2780, "valid_targets_mean": 5439.3, "valid_targets_min": 2668 }, { "epoch": 4.580910586944597, "grad_norm": 0.1662125580893836, "learning_rate": 8.578632664817177e-07, "loss": 0.1181, "loss_nan_ranks": 0, "loss_rank_avg": 0.03744211420416832, "step": 2785, "valid_targets_mean": 5153.3, "valid_targets_min": 2730 }, { "epoch": 4.589138782227098, "grad_norm": 0.18003515710383633, "learning_rate": 8.249102827366306e-07, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.045447975397109985, "step": 2790, "valid_targets_mean": 5870.0, "valid_targets_min": 3065 }, { "epoch": 4.5973669775095996, "grad_norm": 0.16711301896155625, "learning_rate": 7.925893378494942e-07, "loss": 0.1181, "loss_nan_ranks": 0, "loss_rank_avg": 0.041192252188920975, "step": 2795, "valid_targets_mean": 5658.6, "valid_targets_min": 2803 }, { "epoch": 4.605595172792101, "grad_norm": 0.1852534235518299, "learning_rate": 7.609014971656803e-07, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.03670789301395416, "step": 2800, "valid_targets_mean": 5224.7, "valid_targets_min": 2628 }, { "epoch": 4.613823368074602, "grad_norm": 0.16950321374451233, "learning_rate": 7.298478051625335e-07, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.04173382371664047, "step": 2805, "valid_targets_mean": 5735.1, "valid_targets_min": 3533 }, { "epoch": 4.622051563357104, "grad_norm": 0.17829538445378323, "learning_rate": 6.994292854149165e-07, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.038754336535930634, "step": 2810, "valid_targets_mean": 5265.8, "valid_targets_min": 2050 }, { "epoch": 4.630279758639605, "grad_norm": 0.17636268345082917, "learning_rate": 6.696469405615102e-07, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.04200731962919235, "step": 2815, "valid_targets_mean": 5609.0, "valid_targets_min": 3609 }, { "epoch": 4.638507953922106, "grad_norm": 0.1829464386645835, "learning_rate": 6.405017522717316e-07, "loss": 0.1168, "loss_nan_ranks": 0, "loss_rank_avg": 0.037692733108997345, "step": 2820, "valid_targets_mean": 5324.1, "valid_targets_min": 1713 }, { "epoch": 4.6467361492046075, "grad_norm": 0.18881807104757656, "learning_rate": 6.119946812133926e-07, "loss": 0.1176, "loss_nan_ranks": 0, "loss_rank_avg": 0.03966955095529556, "step": 2825, "valid_targets_mean": 4990.3, "valid_targets_min": 665 }, { "epoch": 4.654964344487109, "grad_norm": 0.18184605173434396, "learning_rate": 5.841266670210366e-07, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.03901213780045509, "step": 2830, "valid_targets_mean": 5599.9, "valid_targets_min": 2657 }, { "epoch": 4.663192539769611, "grad_norm": 0.18166398336136586, "learning_rate": 5.568986282649636e-07, "loss": 0.1144, "loss_nan_ranks": 0, "loss_rank_avg": 0.04104125499725342, "step": 2835, "valid_targets_mean": 5342.1, "valid_targets_min": 2880 }, { "epoch": 4.671420735052112, "grad_norm": 0.6466547891111, "learning_rate": 5.303114624209449e-07, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.1742110550403595, "step": 2840, "valid_targets_mean": 3803.8, "valid_targets_min": 1361 }, { "epoch": 4.679648930334613, "grad_norm": 0.5463616335992676, "learning_rate": 5.043660458406563e-07, "loss": 0.4345, "loss_nan_ranks": 0, "loss_rank_avg": 0.14823535084724426, "step": 2845, "valid_targets_mean": 4280.1, "valid_targets_min": 341 }, { "epoch": 4.687877125617114, "grad_norm": 0.42219045429720925, "learning_rate": 4.790632337227785e-07, "loss": 0.4006, "loss_nan_ranks": 0, "loss_rank_avg": 0.11169308423995972, "step": 2850, "valid_targets_mean": 4561.8, "valid_targets_min": 1051 }, { "epoch": 4.6961053208996155, "grad_norm": 0.36411612300260526, "learning_rate": 4.544038600848155e-07, "loss": 0.4252, "loss_nan_ranks": 0, "loss_rank_avg": 0.14665555953979492, "step": 2855, "valid_targets_mean": 3689.7, "valid_targets_min": 1235 }, { "epoch": 4.704333516182118, "grad_norm": 0.30679805398991083, "learning_rate": 4.303887377356053e-07, "loss": 0.3976, "loss_nan_ranks": 0, "loss_rank_avg": 0.11447066068649292, "step": 2860, "valid_targets_mean": 3426.4, "valid_targets_min": 974 }, { "epoch": 4.712561711464619, "grad_norm": 0.3123137521770701, "learning_rate": 4.070186582485214e-07, "loss": 0.396, "loss_nan_ranks": 0, "loss_rank_avg": 0.1737116575241089, "step": 2865, "valid_targets_mean": 3986.3, "valid_targets_min": 1079 }, { "epoch": 4.72078990674712, "grad_norm": 0.26330053899557904, "learning_rate": 3.842943919353914e-07, "loss": 0.3833, "loss_nan_ranks": 0, "loss_rank_avg": 0.11449083685874939, "step": 2870, "valid_targets_mean": 3593.2, "valid_targets_min": 926 }, { "epoch": 4.729018102029621, "grad_norm": 0.2556769576018494, "learning_rate": 3.6221668782109534e-07, "loss": 0.375, "loss_nan_ranks": 0, "loss_rank_avg": 0.11261357367038727, "step": 2875, "valid_targets_mean": 3480.5, "valid_targets_min": 1151 }, { "epoch": 4.737246297312123, "grad_norm": 0.2669807142158802, "learning_rate": 3.4078627361888717e-07, "loss": 0.3942, "loss_nan_ranks": 0, "loss_rank_avg": 0.14366257190704346, "step": 2880, "valid_targets_mean": 3933.4, "valid_targets_min": 1036 }, { "epoch": 4.745474492594624, "grad_norm": 0.2664773916564826, "learning_rate": 3.2000385570640114e-07, "loss": 0.3869, "loss_nan_ranks": 0, "loss_rank_avg": 0.12738540768623352, "step": 2885, "valid_targets_mean": 3254.5, "valid_targets_min": 1190 }, { "epoch": 4.753702687877126, "grad_norm": 0.23815293184151845, "learning_rate": 2.998701191023701e-07, "loss": 0.3684, "loss_nan_ranks": 0, "loss_rank_avg": 0.09321914613246918, "step": 2890, "valid_targets_mean": 3184.5, "valid_targets_min": 627 }, { "epoch": 4.761930883159627, "grad_norm": 0.2341598205900795, "learning_rate": 2.80385727444048e-07, "loss": 0.3995, "loss_nan_ranks": 0, "loss_rank_avg": 0.12059900164604187, "step": 2895, "valid_targets_mean": 4686.7, "valid_targets_min": 1218 }, { "epoch": 4.770159078442129, "grad_norm": 0.24528309024526104, "learning_rate": 2.615513229653366e-07, "loss": 0.3732, "loss_nan_ranks": 0, "loss_rank_avg": 0.14497415721416473, "step": 2900, "valid_targets_mean": 4532.6, "valid_targets_min": 613 }, { "epoch": 4.77838727372463, "grad_norm": 0.2573155357244181, "learning_rate": 2.4336752647561304e-07, "loss": 0.397, "loss_nan_ranks": 0, "loss_rank_avg": 0.12354221940040588, "step": 2905, "valid_targets_mean": 3717.2, "valid_targets_min": 1137 }, { "epoch": 4.786615469007131, "grad_norm": 0.24346065047412174, "learning_rate": 2.2583493733926655e-07, "loss": 0.3876, "loss_nan_ranks": 0, "loss_rank_avg": 0.10926102101802826, "step": 2910, "valid_targets_mean": 3432.2, "valid_targets_min": 766 }, { "epoch": 4.794843664289632, "grad_norm": 0.24025285632400223, "learning_rate": 2.0895413345594527e-07, "loss": 0.3908, "loss_nan_ranks": 0, "loss_rank_avg": 0.14541694521903992, "step": 2915, "valid_targets_mean": 4030.4, "valid_targets_min": 1035 }, { "epoch": 4.803071859572134, "grad_norm": 0.2502583573082134, "learning_rate": 1.9272567124150932e-07, "loss": 0.3916, "loss_nan_ranks": 0, "loss_rank_avg": 0.11226493120193481, "step": 2920, "valid_targets_mean": 3379.8, "valid_targets_min": 1265 }, { "epoch": 4.811300054854636, "grad_norm": 0.27135058705651266, "learning_rate": 1.771500856096875e-07, "loss": 0.3932, "loss_nan_ranks": 0, "loss_rank_avg": 0.11371229588985443, "step": 2925, "valid_targets_mean": 2594.7, "valid_targets_min": 1135 }, { "epoch": 4.819528250137137, "grad_norm": 0.28328121691854996, "learning_rate": 1.6222788995444272e-07, "loss": 0.369, "loss_nan_ranks": 0, "loss_rank_avg": 0.06900590658187866, "step": 2930, "valid_targets_mean": 972.6, "valid_targets_min": 546 }, { "epoch": 4.827756445419638, "grad_norm": 0.2318305134373849, "learning_rate": 1.4795957613305877e-07, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.16254112124443054, "step": 2935, "valid_targets_mean": 5099.9, "valid_targets_min": 1465 }, { "epoch": 4.835984640702139, "grad_norm": 0.24068535986602976, "learning_rate": 1.3434561444992e-07, "loss": 0.3936, "loss_nan_ranks": 0, "loss_rank_avg": 0.15346771478652954, "step": 2940, "valid_targets_mean": 5051.9, "valid_targets_min": 986 }, { "epoch": 4.84421283598464, "grad_norm": 0.39007386893679075, "learning_rate": 1.2138645364101032e-07, "loss": 0.3477, "loss_nan_ranks": 0, "loss_rank_avg": 0.1031792089343071, "step": 2945, "valid_targets_mean": 6354.4, "valid_targets_min": 348 }, { "epoch": 4.852441031267142, "grad_norm": 0.3829605064351524, "learning_rate": 1.0908252085912952e-07, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.07880100607872009, "step": 2950, "valid_targets_mean": 6446.1, "valid_targets_min": 139 }, { "epoch": 4.860669226549644, "grad_norm": 0.3816630053349074, "learning_rate": 9.743422165980454e-08, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.06825752556324005, "step": 2955, "valid_targets_mean": 3949.5, "valid_targets_min": 306 }, { "epoch": 4.868897421832145, "grad_norm": 0.3686134242305812, "learning_rate": 8.64419399879246e-08, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.09232122451066971, "step": 2960, "valid_targets_mean": 6445.5, "valid_targets_min": 501 }, { "epoch": 4.877125617114646, "grad_norm": 0.35617768490637586, "learning_rate": 7.61060381650891e-08, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.08181267231702805, "step": 2965, "valid_targets_mean": 6484.1, "valid_targets_min": 702 }, { "epoch": 4.885353812397147, "grad_norm": 0.3539720544440604, "learning_rate": 6.642685687766159e-08, "loss": 0.264, "loss_nan_ranks": 0, "loss_rank_avg": 0.08130834996700287, "step": 2970, "valid_targets_mean": 7440.5, "valid_targets_min": 914 }, { "epoch": 4.893582007679649, "grad_norm": 0.34241063452198034, "learning_rate": 5.740471516553881e-08, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.09114379435777664, "step": 2975, "valid_targets_mean": 7078.0, "valid_targets_min": 280 }, { "epoch": 4.90181020296215, "grad_norm": 0.3171560903782373, "learning_rate": 4.9039910411643466e-08, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.08341857045888901, "step": 2980, "valid_targets_mean": 6463.1, "valid_targets_min": 1221 }, { "epoch": 4.910038398244652, "grad_norm": 0.3168640296013643, "learning_rate": 4.133271833210772e-08, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.06438249349594116, "step": 2985, "valid_targets_mean": 6061.8, "valid_targets_min": 1412 }, { "epoch": 4.918266593527153, "grad_norm": 0.33532587380496615, "learning_rate": 3.428339296719596e-08, "loss": 0.2502, "loss_nan_ranks": 0, "loss_rank_avg": 0.10326523333787918, "step": 2990, "valid_targets_mean": 6472.4, "valid_targets_min": 277 }, { "epoch": 4.926494788809654, "grad_norm": 0.2979188578639744, "learning_rate": 2.789216667293593e-08, "loss": 0.2527, "loss_nan_ranks": 0, "loss_rank_avg": 0.06032399833202362, "step": 2995, "valid_targets_mean": 7596.1, "valid_targets_min": 2298 }, { "epoch": 4.934722984092156, "grad_norm": 0.3044209930110469, "learning_rate": 2.2159250113438223e-08, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.07601773738861084, "step": 3000, "valid_targets_mean": 7278.7, "valid_targets_min": 299 }, { "epoch": 4.942951179374657, "grad_norm": 0.3175588292516497, "learning_rate": 1.708483225397961e-08, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.09058444201946259, "step": 3005, "valid_targets_mean": 6472.9, "valid_targets_min": 578 }, { "epoch": 4.951179374657158, "grad_norm": 0.32066451016675285, "learning_rate": 1.266908035475467e-08, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.08107155561447144, "step": 3010, "valid_targets_mean": 6411.4, "valid_targets_min": 176 }, { "epoch": 4.95940756993966, "grad_norm": 0.31698950477993576, "learning_rate": 8.912139965369105e-09, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.09014058858156204, "step": 3015, "valid_targets_mean": 5064.2, "valid_targets_min": 746 }, { "epoch": 4.967635765222162, "grad_norm": 0.316410358732829, "learning_rate": 5.814134920048009e-09, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.10155069828033447, "step": 3020, "valid_targets_mean": 6593.2, "valid_targets_min": 1045 }, { "epoch": 4.975863960504663, "grad_norm": 0.3192028950014772, "learning_rate": 3.3751673335458147e-09, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.06748147308826447, "step": 3025, "valid_targets_mean": 5822.4, "valid_targets_min": 952 }, { "epoch": 4.984092155787164, "grad_norm": 0.31201193824927753, "learning_rate": 1.5953175977778679e-09, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.1104644238948822, "step": 3030, "valid_targets_mean": 8131.2, "valid_targets_min": 270 }, { "epoch": 4.992320351069665, "grad_norm": 0.3171727370891135, "learning_rate": 4.746443791869837e-10, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.07531018555164337, "step": 3035, "valid_targets_mean": 6484.8, "valid_targets_min": 1247 }, { "epoch": 5.0, "grad_norm": 1.355991457881435, "learning_rate": 1.3184616789452264e-11, "loss": 0.2833, "loss_nan_ranks": 0, "loss_rank_avg": 0.36725589632987976, "step": 3040, "valid_targets_mean": 6065.3, "valid_targets_min": 1413 }, { "epoch": 5.0, "step": 3040, "total_flos": 9.271417366388933e+18, "train_loss": 0.0, "train_runtime": 4.0738, "train_samples_per_second": 71564.652, "train_steps_per_second": 746.232 } ], "logging_steps": 5, "max_steps": 3040, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 300, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 9.271417366388933e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }