Files
llama3_3b_instruct_vallina_…/trainer_log.jsonl
ModelHub XC 2e0befc9df 初始化项目,由ModelHub XC社区提供模型
Model: Yaseal/llama3_3b_instruct_vallina_full_sft_30k
Source: Original Platform
2026-04-11 23:15:17 +08:00

119 lines
22 KiB
JSON

{"current_steps": 10, "total_steps": 1164, "loss": 0.8691, "lr": 1.5384615384615387e-06, "epoch": 0.01718213058419244, "percentage": 0.86, "elapsed_time": "0:02:07", "remaining_time": "4:04:26"}
{"current_steps": 20, "total_steps": 1164, "loss": 0.7729, "lr": 3.247863247863248e-06, "epoch": 0.03436426116838488, "percentage": 1.72, "elapsed_time": "0:04:13", "remaining_time": "4:01:13"}
{"current_steps": 30, "total_steps": 1164, "loss": 0.6791, "lr": 4.957264957264958e-06, "epoch": 0.05154639175257732, "percentage": 2.58, "elapsed_time": "0:06:18", "remaining_time": "3:58:24"}
{"current_steps": 40, "total_steps": 1164, "loss": 0.6453, "lr": 6.666666666666667e-06, "epoch": 0.06872852233676977, "percentage": 3.44, "elapsed_time": "0:08:23", "remaining_time": "3:55:45"}
{"current_steps": 50, "total_steps": 1164, "loss": 0.612, "lr": 8.376068376068377e-06, "epoch": 0.0859106529209622, "percentage": 4.3, "elapsed_time": "0:10:29", "remaining_time": "3:53:34"}
{"current_steps": 60, "total_steps": 1164, "loss": 0.6023, "lr": 1.0085470085470086e-05, "epoch": 0.10309278350515463, "percentage": 5.15, "elapsed_time": "0:12:34", "remaining_time": "3:51:16"}
{"current_steps": 70, "total_steps": 1164, "loss": 0.5756, "lr": 1.1794871794871796e-05, "epoch": 0.12027491408934708, "percentage": 6.01, "elapsed_time": "0:14:39", "remaining_time": "3:49:07"}
{"current_steps": 80, "total_steps": 1164, "loss": 0.5798, "lr": 1.3504273504273506e-05, "epoch": 0.13745704467353953, "percentage": 6.87, "elapsed_time": "0:16:44", "remaining_time": "3:46:57"}
{"current_steps": 90, "total_steps": 1164, "loss": 0.5444, "lr": 1.5213675213675214e-05, "epoch": 0.15463917525773196, "percentage": 7.73, "elapsed_time": "0:18:50", "remaining_time": "3:44:49"}
{"current_steps": 100, "total_steps": 1164, "loss": 0.5604, "lr": 1.6923076923076924e-05, "epoch": 0.1718213058419244, "percentage": 8.59, "elapsed_time": "0:20:56", "remaining_time": "3:42:45"}
{"current_steps": 110, "total_steps": 1164, "loss": 0.5569, "lr": 1.8632478632478636e-05, "epoch": 0.18900343642611683, "percentage": 9.45, "elapsed_time": "0:23:01", "remaining_time": "3:40:36"}
{"current_steps": 120, "total_steps": 1164, "loss": 0.5541, "lr": 1.999981993260809e-05, "epoch": 0.20618556701030927, "percentage": 10.31, "elapsed_time": "0:25:06", "remaining_time": "3:38:27"}
{"current_steps": 130, "total_steps": 1164, "loss": 0.5664, "lr": 1.9993518254774517e-05, "epoch": 0.22336769759450173, "percentage": 11.17, "elapsed_time": "0:27:12", "remaining_time": "3:36:21"}
{"current_steps": 140, "total_steps": 1164, "loss": 0.5433, "lr": 1.9978219691148676e-05, "epoch": 0.24054982817869416, "percentage": 12.03, "elapsed_time": "0:29:17", "remaining_time": "3:34:11"}
{"current_steps": 150, "total_steps": 1164, "loss": 0.5348, "lr": 1.9953938014600757e-05, "epoch": 0.25773195876288657, "percentage": 12.89, "elapsed_time": "0:31:22", "remaining_time": "3:32:05"}
{"current_steps": 160, "total_steps": 1164, "loss": 0.5427, "lr": 1.9920695085247012e-05, "epoch": 0.27491408934707906, "percentage": 13.75, "elapsed_time": "0:33:27", "remaining_time": "3:29:59"}
{"current_steps": 170, "total_steps": 1164, "loss": 0.5441, "lr": 1.9878520830769675e-05, "epoch": 0.2920962199312715, "percentage": 14.6, "elapsed_time": "0:35:33", "remaining_time": "3:27:53"}
{"current_steps": 180, "total_steps": 1164, "loss": 0.5425, "lr": 1.9827453219473925e-05, "epoch": 0.30927835051546393, "percentage": 15.46, "elapsed_time": "0:37:38", "remaining_time": "3:25:47"}
{"current_steps": 190, "total_steps": 1164, "loss": 0.5386, "lr": 1.9767538226106078e-05, "epoch": 0.32646048109965636, "percentage": 16.32, "elapsed_time": "0:39:43", "remaining_time": "3:23:39"}
{"current_steps": 200, "total_steps": 1164, "loss": 0.54, "lr": 1.9698829790463792e-05, "epoch": 0.3436426116838488, "percentage": 17.18, "elapsed_time": "0:41:48", "remaining_time": "3:21:31"}
{"current_steps": 210, "total_steps": 1164, "loss": 0.5302, "lr": 1.962138976883558e-05, "epoch": 0.36082474226804123, "percentage": 18.04, "elapsed_time": "0:43:53", "remaining_time": "3:19:25"}
{"current_steps": 220, "total_steps": 1164, "loss": 0.5323, "lr": 1.9535287878313315e-05, "epoch": 0.37800687285223367, "percentage": 18.9, "elapsed_time": "0:45:59", "remaining_time": "3:17:19"}
{"current_steps": 230, "total_steps": 1164, "loss": 0.5194, "lr": 1.9440601634027892e-05, "epoch": 0.3951890034364261, "percentage": 19.76, "elapsed_time": "0:48:05", "remaining_time": "3:15:15"}
{"current_steps": 240, "total_steps": 1164, "loss": 0.5298, "lr": 1.9337416279364486e-05, "epoch": 0.41237113402061853, "percentage": 20.62, "elapsed_time": "0:50:10", "remaining_time": "3:13:10"}
{"current_steps": 250, "total_steps": 1164, "loss": 0.5246, "lr": 1.922582470922034e-05, "epoch": 0.42955326460481097, "percentage": 21.48, "elapsed_time": "0:52:15", "remaining_time": "3:11:04"}
{"current_steps": 260, "total_steps": 1164, "loss": 0.5066, "lr": 1.910592738637407e-05, "epoch": 0.44673539518900346, "percentage": 22.34, "elapsed_time": "0:54:21", "remaining_time": "3:08:58"}
{"current_steps": 270, "total_steps": 1164, "loss": 0.5303, "lr": 1.897783225104181e-05, "epoch": 0.4639175257731959, "percentage": 23.2, "elapsed_time": "0:56:26", "remaining_time": "3:06:52"}
{"current_steps": 280, "total_steps": 1164, "loss": 0.5225, "lr": 1.8841654623701673e-05, "epoch": 0.48109965635738833, "percentage": 24.05, "elapsed_time": "0:58:31", "remaining_time": "3:04:45"}
{"current_steps": 290, "total_steps": 1164, "loss": 0.5052, "lr": 1.869751710127392e-05, "epoch": 0.49828178694158076, "percentage": 24.91, "elapsed_time": "1:00:36", "remaining_time": "3:02:39"}
{"current_steps": 300, "total_steps": 1164, "loss": 0.5143, "lr": 1.8545549446750392e-05, "epoch": 0.5154639175257731, "percentage": 25.77, "elapsed_time": "1:02:42", "remaining_time": "3:00:34"}
{"current_steps": 310, "total_steps": 1164, "loss": 0.5129, "lr": 1.8385888472372474e-05, "epoch": 0.5326460481099656, "percentage": 26.63, "elapsed_time": "1:04:47", "remaining_time": "2:58:29"}
{"current_steps": 320, "total_steps": 1164, "loss": 0.5131, "lr": 1.8218677916462882e-05, "epoch": 0.5498281786941581, "percentage": 27.49, "elapsed_time": "1:06:52", "remaining_time": "2:56:23"}
{"current_steps": 330, "total_steps": 1164, "loss": 0.5099, "lr": 1.8044068314022057e-05, "epoch": 0.5670103092783505, "percentage": 28.35, "elapsed_time": "1:08:58", "remaining_time": "2:54:18"}
{"current_steps": 340, "total_steps": 1164, "loss": 0.5166, "lr": 1.786221686120567e-05, "epoch": 0.584192439862543, "percentage": 29.21, "elapsed_time": "1:11:03", "remaining_time": "2:52:11"}
{"current_steps": 350, "total_steps": 1164, "loss": 0.5228, "lr": 1.7673287273805342e-05, "epoch": 0.6013745704467354, "percentage": 30.07, "elapsed_time": "1:13:08", "remaining_time": "2:50:06"}
{"current_steps": 360, "total_steps": 1164, "loss": 0.5099, "lr": 1.7477449639859876e-05, "epoch": 0.6185567010309279, "percentage": 30.93, "elapsed_time": "1:15:13", "remaining_time": "2:48:01"}
{"current_steps": 370, "total_steps": 1164, "loss": 0.5047, "lr": 1.7274880266529716e-05, "epoch": 0.6357388316151202, "percentage": 31.79, "elapsed_time": "1:17:19", "remaining_time": "2:45:56"}
{"current_steps": 380, "total_steps": 1164, "loss": 0.4984, "lr": 1.7065761521372562e-05, "epoch": 0.6529209621993127, "percentage": 32.65, "elapsed_time": "1:19:24", "remaining_time": "2:43:49"}
{"current_steps": 390, "total_steps": 1164, "loss": 0.5079, "lr": 1.6850281668162908e-05, "epoch": 0.6701030927835051, "percentage": 33.51, "elapsed_time": "1:21:29", "remaining_time": "2:41:44"}
{"current_steps": 400, "total_steps": 1164, "loss": 0.5086, "lr": 1.6628634697403447e-05, "epoch": 0.6872852233676976, "percentage": 34.36, "elapsed_time": "1:23:34", "remaining_time": "2:39:38"}
{"current_steps": 410, "total_steps": 1164, "loss": 0.4957, "lr": 1.6401020151680815e-05, "epoch": 0.7044673539518901, "percentage": 35.22, "elapsed_time": "1:25:40", "remaining_time": "2:37:33"}
{"current_steps": 420, "total_steps": 1164, "loss": 0.5021, "lr": 1.6167642946022956e-05, "epoch": 0.7216494845360825, "percentage": 36.08, "elapsed_time": "1:27:45", "remaining_time": "2:35:27"}
{"current_steps": 430, "total_steps": 1164, "loss": 0.5146, "lr": 1.592871318341986e-05, "epoch": 0.738831615120275, "percentage": 36.94, "elapsed_time": "1:29:51", "remaining_time": "2:33:22"}
{"current_steps": 440, "total_steps": 1164, "loss": 0.5087, "lr": 1.5684445965673693e-05, "epoch": 0.7560137457044673, "percentage": 37.8, "elapsed_time": "1:31:56", "remaining_time": "2:31:16"}
{"current_steps": 450, "total_steps": 1164, "loss": 0.5065, "lr": 1.5435061199748625e-05, "epoch": 0.7731958762886598, "percentage": 38.66, "elapsed_time": "1:34:01", "remaining_time": "2:29:10"}
{"current_steps": 460, "total_steps": 1164, "loss": 0.5092, "lr": 1.5180783399794749e-05, "epoch": 0.7903780068728522, "percentage": 39.52, "elapsed_time": "1:36:06", "remaining_time": "2:27:05"}
{"current_steps": 470, "total_steps": 1164, "loss": 0.4999, "lr": 1.4921841485024236e-05, "epoch": 0.8075601374570447, "percentage": 40.38, "elapsed_time": "1:38:12", "remaining_time": "2:25:00"}
{"current_steps": 480, "total_steps": 1164, "loss": 0.4992, "lr": 1.4658468573621752e-05, "epoch": 0.8247422680412371, "percentage": 41.24, "elapsed_time": "1:40:17", "remaining_time": "2:22:54"}
{"current_steps": 490, "total_steps": 1164, "loss": 0.5041, "lr": 1.4390901772874668e-05, "epoch": 0.8419243986254296, "percentage": 42.1, "elapsed_time": "1:42:23", "remaining_time": "2:20:49"}
{"current_steps": 500, "total_steps": 1164, "loss": 0.4942, "lr": 1.4119381965711976e-05, "epoch": 0.8591065292096219, "percentage": 42.96, "elapsed_time": "1:44:28", "remaining_time": "2:18:44"}
{"current_steps": 510, "total_steps": 1164, "loss": 0.4877, "lr": 1.3844153593844098e-05, "epoch": 0.8762886597938144, "percentage": 43.81, "elapsed_time": "1:46:33", "remaining_time": "2:16:38"}
{"current_steps": 520, "total_steps": 1164, "loss": 0.4868, "lr": 1.356546443769885e-05, "epoch": 0.8934707903780069, "percentage": 44.67, "elapsed_time": "1:48:38", "remaining_time": "2:14:33"}
{"current_steps": 530, "total_steps": 1164, "loss": 0.5083, "lr": 1.328356539335161e-05, "epoch": 0.9106529209621993, "percentage": 45.53, "elapsed_time": "1:50:44", "remaining_time": "2:12:27"}
{"current_steps": 540, "total_steps": 1164, "loss": 0.4913, "lr": 1.2998710246650594e-05, "epoch": 0.9278350515463918, "percentage": 46.39, "elapsed_time": "1:52:49", "remaining_time": "2:10:22"}
{"current_steps": 550, "total_steps": 1164, "loss": 0.494, "lr": 1.2711155444740529e-05, "epoch": 0.9450171821305842, "percentage": 47.25, "elapsed_time": "1:54:55", "remaining_time": "2:08:17"}
{"current_steps": 560, "total_steps": 1164, "loss": 0.5144, "lr": 1.242115986519044e-05, "epoch": 0.9621993127147767, "percentage": 48.11, "elapsed_time": "1:57:00", "remaining_time": "2:06:11"}
{"current_steps": 570, "total_steps": 1164, "loss": 0.4891, "lr": 1.2128984582933397e-05, "epoch": 0.979381443298969, "percentage": 48.97, "elapsed_time": "1:59:04", "remaining_time": "2:04:05"}
{"current_steps": 580, "total_steps": 1164, "loss": 0.4825, "lr": 1.1834892635228024e-05, "epoch": 0.9965635738831615, "percentage": 49.83, "elapsed_time": "2:01:10", "remaining_time": "2:02:00"}
{"current_steps": 590, "total_steps": 1164, "loss": 0.4331, "lr": 1.1539148784853404e-05, "epoch": 1.013745704467354, "percentage": 50.69, "elapsed_time": "2:04:10", "remaining_time": "2:00:48"}
{"current_steps": 600, "total_steps": 1164, "loss": 0.4127, "lr": 1.1242019281750525e-05, "epoch": 1.0309278350515463, "percentage": 51.55, "elapsed_time": "2:06:16", "remaining_time": "1:58:41"}
{"current_steps": 610, "total_steps": 1164, "loss": 0.4022, "lr": 1.0943771623324884e-05, "epoch": 1.0481099656357389, "percentage": 52.41, "elapsed_time": "2:08:21", "remaining_time": "1:56:34"}
{"current_steps": 620, "total_steps": 1164, "loss": 0.4074, "lr": 1.064467431362603e-05, "epoch": 1.0652920962199313, "percentage": 53.26, "elapsed_time": "2:10:27", "remaining_time": "1:54:27"}
{"current_steps": 630, "total_steps": 1164, "loss": 0.4173, "lr": 1.0344996621620862e-05, "epoch": 1.0824742268041236, "percentage": 54.12, "elapsed_time": "2:12:33", "remaining_time": "1:52:21"}
{"current_steps": 640, "total_steps": 1164, "loss": 0.4071, "lr": 1.004500833877828e-05, "epoch": 1.0996563573883162, "percentage": 54.98, "elapsed_time": "2:14:38", "remaining_time": "1:50:14"}
{"current_steps": 650, "total_steps": 1164, "loss": 0.4128, "lr": 9.744979536183458e-06, "epoch": 1.1168384879725086, "percentage": 55.84, "elapsed_time": "2:16:43", "remaining_time": "1:48:07"}
{"current_steps": 660, "total_steps": 1164, "loss": 0.4162, "lr": 9.445180321400373e-06, "epoch": 1.134020618556701, "percentage": 56.7, "elapsed_time": "2:18:49", "remaining_time": "1:46:00"}
{"current_steps": 670, "total_steps": 1164, "loss": 0.4087, "lr": 9.145880595301495e-06, "epoch": 1.1512027491408934, "percentage": 57.56, "elapsed_time": "2:20:54", "remaining_time": "1:43:53"}
{"current_steps": 680, "total_steps": 1164, "loss": 0.4104, "lr": 8.847349809083557e-06, "epoch": 1.168384879725086, "percentage": 58.42, "elapsed_time": "2:23:00", "remaining_time": "1:41:47"}
{"current_steps": 690, "total_steps": 1164, "loss": 0.4186, "lr": 8.54985672168817e-06, "epoch": 1.1855670103092784, "percentage": 59.28, "elapsed_time": "2:25:06", "remaining_time": "1:39:40"}
{"current_steps": 700, "total_steps": 1164, "loss": 0.4027, "lr": 8.253669157845632e-06, "epoch": 1.2027491408934707, "percentage": 60.14, "elapsed_time": "2:27:11", "remaining_time": "1:37:34"}
{"current_steps": 710, "total_steps": 1164, "loss": 0.3996, "lr": 7.959053766959785e-06, "epoch": 1.2199312714776633, "percentage": 61.0, "elapsed_time": "2:29:17", "remaining_time": "1:35:27"}
{"current_steps": 720, "total_steps": 1164, "loss": 0.4053, "lr": 7.666275783051012e-06, "epoch": 1.2371134020618557, "percentage": 61.86, "elapsed_time": "2:31:22", "remaining_time": "1:33:20"}
{"current_steps": 730, "total_steps": 1164, "loss": 0.4065, "lr": 7.375598785973429e-06, "epoch": 1.254295532646048, "percentage": 62.71, "elapsed_time": "2:33:27", "remaining_time": "1:31:14"}
{"current_steps": 740, "total_steps": 1164, "loss": 0.4041, "lr": 7.087284464121305e-06, "epoch": 1.2714776632302405, "percentage": 63.57, "elapsed_time": "2:35:33", "remaining_time": "1:29:07"}
{"current_steps": 750, "total_steps": 1164, "loss": 0.4055, "lr": 6.801592378838282e-06, "epoch": 1.2886597938144329, "percentage": 64.43, "elapsed_time": "2:37:38", "remaining_time": "1:27:01"}
{"current_steps": 760, "total_steps": 1164, "loss": 0.4143, "lr": 6.518779730741555e-06, "epoch": 1.3058419243986255, "percentage": 65.29, "elapsed_time": "2:39:43", "remaining_time": "1:24:54"}
{"current_steps": 770, "total_steps": 1164, "loss": 0.3931, "lr": 6.239101128171317e-06, "epoch": 1.3230240549828178, "percentage": 66.15, "elapsed_time": "2:41:49", "remaining_time": "1:22:48"}
{"current_steps": 780, "total_steps": 1164, "loss": 0.4126, "lr": 5.9628083579739715e-06, "epoch": 1.3402061855670104, "percentage": 67.01, "elapsed_time": "2:43:54", "remaining_time": "1:20:41"}
{"current_steps": 790, "total_steps": 1164, "loss": 0.4108, "lr": 5.690150158825462e-06, "epoch": 1.3573883161512028, "percentage": 67.87, "elapsed_time": "2:46:00", "remaining_time": "1:18:35"}
{"current_steps": 800, "total_steps": 1164, "loss": 0.4057, "lr": 5.421371997298781e-06, "epoch": 1.3745704467353952, "percentage": 68.73, "elapsed_time": "2:48:05", "remaining_time": "1:16:28"}
{"current_steps": 810, "total_steps": 1164, "loss": 0.4018, "lr": 5.156715846877234e-06, "epoch": 1.3917525773195876, "percentage": 69.59, "elapsed_time": "2:50:10", "remaining_time": "1:14:22"}
{"current_steps": 820, "total_steps": 1164, "loss": 0.4039, "lr": 4.896419970112499e-06, "epoch": 1.40893470790378, "percentage": 70.45, "elapsed_time": "2:52:15", "remaining_time": "1:12:16"}
{"current_steps": 830, "total_steps": 1164, "loss": 0.3968, "lr": 4.640718704123472e-06, "epoch": 1.4261168384879725, "percentage": 71.31, "elapsed_time": "2:54:20", "remaining_time": "1:10:09"}
{"current_steps": 840, "total_steps": 1164, "loss": 0.4049, "lr": 4.389842249629095e-06, "epoch": 1.443298969072165, "percentage": 72.16, "elapsed_time": "2:56:25", "remaining_time": "1:08:03"}
{"current_steps": 850, "total_steps": 1164, "loss": 0.4046, "lr": 4.144016463705081e-06, "epoch": 1.4604810996563573, "percentage": 73.02, "elapsed_time": "2:58:31", "remaining_time": "1:05:56"}
{"current_steps": 860, "total_steps": 1164, "loss": 0.3988, "lr": 3.903462656451074e-06, "epoch": 1.47766323024055, "percentage": 73.88, "elapsed_time": "3:00:37", "remaining_time": "1:03:50"}
{"current_steps": 870, "total_steps": 1164, "loss": 0.3968, "lr": 3.668397391751336e-06, "epoch": 1.4948453608247423, "percentage": 74.74, "elapsed_time": "3:02:42", "remaining_time": "1:01:44"}
{"current_steps": 880, "total_steps": 1164, "loss": 0.4013, "lr": 3.4390322923083385e-06, "epoch": 1.5120274914089347, "percentage": 75.6, "elapsed_time": "3:04:48", "remaining_time": "0:59:38"}
{"current_steps": 890, "total_steps": 1164, "loss": 0.391, "lr": 3.2155738491247303e-06, "epoch": 1.529209621993127, "percentage": 76.46, "elapsed_time": "3:06:53", "remaining_time": "0:57:32"}
{"current_steps": 900, "total_steps": 1164, "loss": 0.3999, "lr": 2.99822323560525e-06, "epoch": 1.5463917525773194, "percentage": 77.32, "elapsed_time": "3:08:59", "remaining_time": "0:55:26"}
{"current_steps": 910, "total_steps": 1164, "loss": 0.4, "lr": 2.787176126445923e-06, "epoch": 1.563573883161512, "percentage": 78.18, "elapsed_time": "3:11:04", "remaining_time": "0:53:20"}
{"current_steps": 920, "total_steps": 1164, "loss": 0.4084, "lr": 2.582622521473588e-06, "epoch": 1.5807560137457046, "percentage": 79.04, "elapsed_time": "3:13:10", "remaining_time": "0:51:13"}
{"current_steps": 930, "total_steps": 1164, "loss": 0.4019, "lr": 2.384746574594343e-06, "epoch": 1.597938144329897, "percentage": 79.9, "elapsed_time": "3:15:15", "remaining_time": "0:49:07"}
{"current_steps": 940, "total_steps": 1164, "loss": 0.3987, "lr": 2.1937264280049365e-06, "epoch": 1.6151202749140894, "percentage": 80.76, "elapsed_time": "3:17:20", "remaining_time": "0:47:01"}
{"current_steps": 950, "total_steps": 1164, "loss": 0.4012, "lr": 2.0097340518163e-06, "epoch": 1.6323024054982818, "percentage": 81.62, "elapsed_time": "3:19:26", "remaining_time": "0:44:55"}
{"current_steps": 960, "total_steps": 1164, "loss": 0.3925, "lr": 1.8329350892336616e-06, "epoch": 1.6494845360824741, "percentage": 82.47, "elapsed_time": "3:21:31", "remaining_time": "0:42:49"}
{"current_steps": 970, "total_steps": 1164, "loss": 0.4053, "lr": 1.6634887074325844e-06, "epoch": 1.6666666666666665, "percentage": 83.33, "elapsed_time": "3:23:37", "remaining_time": "0:40:43"}
{"current_steps": 980, "total_steps": 1164, "loss": 0.4015, "lr": 1.5015474542651964e-06, "epoch": 1.6838487972508591, "percentage": 84.19, "elapsed_time": "3:25:42", "remaining_time": "0:38:37"}
{"current_steps": 990, "total_steps": 1164, "loss": 0.404, "lr": 1.3472571209256157e-06, "epoch": 1.7010309278350515, "percentage": 85.05, "elapsed_time": "3:27:48", "remaining_time": "0:36:31"}
{"current_steps": 1000, "total_steps": 1164, "loss": 0.3879, "lr": 1.200756610698205e-06, "epoch": 1.718213058419244, "percentage": 85.91, "elapsed_time": "3:29:53", "remaining_time": "0:34:25"}
{"current_steps": 1000, "total_steps": 1164, "eval_loss": 0.47505149245262146, "epoch": 1.718213058419244, "percentage": 85.91, "elapsed_time": "3:30:15", "remaining_time": "0:34:28"}
{"current_steps": 1010, "total_steps": 1164, "loss": 0.3909, "lr": 1.0621778139068128e-06, "epoch": 1.7353951890034365, "percentage": 86.77, "elapsed_time": "3:32:21", "remaining_time": "0:32:22"}
{"current_steps": 1020, "total_steps": 1164, "loss": 0.3951, "lr": 9.316454891775983e-07, "epoch": 1.7525773195876289, "percentage": 87.63, "elapsed_time": "3:34:26", "remaining_time": "0:30:16"}
{"current_steps": 1030, "total_steps": 1164, "loss": 0.3917, "lr": 8.092771511223185e-07, "epoch": 1.7697594501718212, "percentage": 88.49, "elapsed_time": "3:36:31", "remaining_time": "0:28:10"}
{"current_steps": 1040, "total_steps": 1164, "loss": 0.3925, "lr": 6.951829645431985e-07, "epoch": 1.7869415807560136, "percentage": 89.35, "elapsed_time": "3:38:36", "remaining_time": "0:26:03"}
{"current_steps": 1050, "total_steps": 1164, "loss": 0.3984, "lr": 5.894656452546343e-07, "epoch": 1.8041237113402062, "percentage": 90.21, "elapsed_time": "3:40:41", "remaining_time": "0:23:57"}
{"current_steps": 1060, "total_steps": 1164, "loss": 0.3977, "lr": 4.92220367611006e-07, "epoch": 1.8213058419243986, "percentage": 91.07, "elapsed_time": "3:42:46", "remaining_time": "0:21:51"}
{"current_steps": 1070, "total_steps": 1164, "loss": 0.402, "lr": 4.035346788238681e-07, "epoch": 1.8384879725085912, "percentage": 91.92, "elapsed_time": "3:44:51", "remaining_time": "0:19:45"}
{"current_steps": 1080, "total_steps": 1164, "loss": 0.397, "lr": 3.2348842014562564e-07, "epoch": 1.8556701030927836, "percentage": 92.78, "elapsed_time": "3:46:57", "remaining_time": "0:17:39"}
{"current_steps": 1090, "total_steps": 1164, "loss": 0.4038, "lr": 2.5215365499069446e-07, "epoch": 1.872852233676976, "percentage": 93.64, "elapsed_time": "3:49:02", "remaining_time": "0:15:32"}
{"current_steps": 1100, "total_steps": 1164, "loss": 0.4018, "lr": 1.895946040588048e-07, "epoch": 1.8900343642611683, "percentage": 94.5, "elapsed_time": "3:51:08", "remaining_time": "0:13:26"}
{"current_steps": 1110, "total_steps": 1164, "loss": 0.3945, "lr": 1.3586758751890638e-07, "epoch": 1.9072164948453607, "percentage": 95.36, "elapsed_time": "3:53:13", "remaining_time": "0:11:20"}
{"current_steps": 1120, "total_steps": 1164, "loss": 0.411, "lr": 9.10209743056889e-08, "epoch": 1.9243986254295533, "percentage": 96.22, "elapsed_time": "3:55:18", "remaining_time": "0:09:14"}
{"current_steps": 1130, "total_steps": 1164, "loss": 0.4021, "lr": 5.509513857437365e-08, "epoch": 1.9415807560137457, "percentage": 97.08, "elapsed_time": "3:57:24", "remaining_time": "0:07:08"}
{"current_steps": 1140, "total_steps": 1164, "loss": 0.3981, "lr": 2.812242335299642e-08, "epoch": 1.9587628865979383, "percentage": 97.94, "elapsed_time": "3:59:29", "remaining_time": "0:05:02"}
{"current_steps": 1150, "total_steps": 1164, "loss": 0.3999, "lr": 1.0127111424872437e-08, "epoch": 1.9759450171821307, "percentage": 98.8, "elapsed_time": "4:01:34", "remaining_time": "0:02:56"}
{"current_steps": 1160, "total_steps": 1164, "loss": 0.3927, "lr": 1.125403467490127e-09, "epoch": 1.993127147766323, "percentage": 99.66, "elapsed_time": "4:03:40", "remaining_time": "0:00:50"}
{"current_steps": 1164, "total_steps": 1164, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "4:05:24", "remaining_time": "0:00:00"}