Model: cjiao/OpenThoughts3-greedy-groups-top-openthinker3-1.5B-checkpoint-375-80 Source: Original Platform
162 lines
28 KiB
JSON
162 lines
28 KiB
JSON
{"current_steps": 1, "total_steps": 160, "loss": 1.4456, "lr": 0.00015998457923856519, "epoch": 0.0125, "percentage": 0.62, "elapsed_time": "0:01:38", "remaining_time": "4:22:01"}
|
|
{"current_steps": 2, "total_steps": 160, "loss": 4.3349, "lr": 0.00015993832289925785, "epoch": 0.025, "percentage": 1.25, "elapsed_time": "0:03:17", "remaining_time": "4:19:38"}
|
|
{"current_steps": 3, "total_steps": 160, "loss": 2.6695, "lr": 0.0001598612488147773, "epoch": 0.0375, "percentage": 1.88, "elapsed_time": "0:04:55", "remaining_time": "4:17:58"}
|
|
{"current_steps": 4, "total_steps": 160, "loss": 2.3799, "lr": 0.00015975338669865026, "epoch": 0.05, "percentage": 2.5, "elapsed_time": "0:06:34", "remaining_time": "4:16:43"}
|
|
{"current_steps": 5, "total_steps": 160, "loss": 2.0935, "lr": 0.00015961477813377576, "epoch": 0.0625, "percentage": 3.12, "elapsed_time": "0:08:13", "remaining_time": "4:15:10"}
|
|
{"current_steps": 6, "total_steps": 160, "loss": 1.8465, "lr": 0.00015944547655639412, "epoch": 0.075, "percentage": 3.75, "elapsed_time": "0:09:52", "remaining_time": "4:13:32"}
|
|
{"current_steps": 7, "total_steps": 160, "loss": 1.7321, "lr": 0.00015924554723548617, "epoch": 0.0875, "percentage": 4.38, "elapsed_time": "0:11:31", "remaining_time": "4:11:55"}
|
|
{"current_steps": 8, "total_steps": 160, "loss": 1.7284, "lr": 0.00015901506724761103, "epoch": 0.1, "percentage": 5.0, "elapsed_time": "0:13:10", "remaining_time": "4:10:12"}
|
|
{"current_steps": 9, "total_steps": 160, "loss": 1.5971, "lr": 0.00015875412544719134, "epoch": 0.1125, "percentage": 5.62, "elapsed_time": "0:14:49", "remaining_time": "4:08:40"}
|
|
{"current_steps": 10, "total_steps": 160, "loss": 1.562, "lr": 0.00015846282243225845, "epoch": 0.125, "percentage": 6.25, "elapsed_time": "0:16:27", "remaining_time": "4:06:52"}
|
|
{"current_steps": 11, "total_steps": 160, "loss": 1.578, "lr": 0.0001581412705056698, "epoch": 0.1375, "percentage": 6.88, "elapsed_time": "0:18:06", "remaining_time": "4:05:12"}
|
|
{"current_steps": 12, "total_steps": 160, "loss": 1.4977, "lr": 0.00015778959363181415, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "0:19:44", "remaining_time": "4:03:33"}
|
|
{"current_steps": 13, "total_steps": 160, "loss": 1.5075, "lr": 0.0001574079273888208, "epoch": 0.1625, "percentage": 8.12, "elapsed_time": "0:21:23", "remaining_time": "4:01:52"}
|
|
{"current_steps": 14, "total_steps": 160, "loss": 1.4158, "lr": 0.00015699641891629178, "epoch": 0.175, "percentage": 8.75, "elapsed_time": "0:23:01", "remaining_time": "4:00:11"}
|
|
{"current_steps": 15, "total_steps": 160, "loss": 1.4219, "lr": 0.00015655522685857672, "epoch": 0.1875, "percentage": 9.38, "elapsed_time": "0:24:40", "remaining_time": "3:58:31"}
|
|
{"current_steps": 16, "total_steps": 160, "loss": 1.4006, "lr": 0.0001560845213036123, "epoch": 0.2, "percentage": 10.0, "elapsed_time": "0:26:18", "remaining_time": "3:56:49"}
|
|
{"current_steps": 17, "total_steps": 160, "loss": 1.3675, "lr": 0.00015558448371735025, "epoch": 0.2125, "percentage": 10.62, "elapsed_time": "0:27:57", "remaining_time": "3:55:10"}
|
|
{"current_steps": 18, "total_steps": 160, "loss": 1.3369, "lr": 0.00015505530687379875, "epoch": 0.225, "percentage": 11.25, "elapsed_time": "0:29:36", "remaining_time": "3:53:33"}
|
|
{"current_steps": 19, "total_steps": 160, "loss": 1.3632, "lr": 0.00015449719478070428, "epoch": 0.2375, "percentage": 11.88, "elapsed_time": "0:31:14", "remaining_time": "3:51:50"}
|
|
{"current_steps": 20, "total_steps": 160, "loss": 1.3511, "lr": 0.00015391036260090294, "epoch": 0.25, "percentage": 12.5, "elapsed_time": "0:32:53", "remaining_time": "3:50:13"}
|
|
{"current_steps": 21, "total_steps": 160, "loss": 1.3641, "lr": 0.0001532950365693709, "epoch": 0.2625, "percentage": 13.12, "elapsed_time": "0:34:31", "remaining_time": "3:48:31"}
|
|
{"current_steps": 22, "total_steps": 160, "loss": 1.3441, "lr": 0.00015265145390600652, "epoch": 0.275, "percentage": 13.75, "elapsed_time": "0:36:09", "remaining_time": "3:46:47"}
|
|
{"current_steps": 23, "total_steps": 160, "loss": 1.3418, "lr": 0.00015197986272417774, "epoch": 0.2875, "percentage": 14.37, "elapsed_time": "0:37:48", "remaining_time": "3:45:10"}
|
|
{"current_steps": 24, "total_steps": 160, "loss": 1.3646, "lr": 0.00015128052193506944, "epoch": 0.3, "percentage": 15.0, "elapsed_time": "0:39:26", "remaining_time": "3:43:30"}
|
|
{"current_steps": 25, "total_steps": 160, "loss": 1.2992, "lr": 0.0001505537011478684, "epoch": 0.3125, "percentage": 15.62, "elapsed_time": "0:41:05", "remaining_time": "3:41:53"}
|
|
{"current_steps": 26, "total_steps": 160, "loss": 1.3435, "lr": 0.0001497996805658238, "epoch": 0.325, "percentage": 16.25, "elapsed_time": "0:42:44", "remaining_time": "3:40:15"}
|
|
{"current_steps": 27, "total_steps": 160, "loss": 1.3, "lr": 0.00014901875087822337, "epoch": 0.3375, "percentage": 16.88, "elapsed_time": "0:44:22", "remaining_time": "3:38:37"}
|
|
{"current_steps": 28, "total_steps": 160, "loss": 1.3103, "lr": 0.0001482112131483274, "epoch": 0.35, "percentage": 17.5, "elapsed_time": "0:46:01", "remaining_time": "3:36:57"}
|
|
{"current_steps": 29, "total_steps": 160, "loss": 1.2731, "lr": 0.00014737737869730292, "epoch": 0.3625, "percentage": 18.12, "elapsed_time": "0:47:39", "remaining_time": "3:35:18"}
|
|
{"current_steps": 30, "total_steps": 160, "loss": 1.3211, "lr": 0.00014651756898420365, "epoch": 0.375, "percentage": 18.75, "elapsed_time": "0:49:18", "remaining_time": "3:33:38"}
|
|
{"current_steps": 31, "total_steps": 160, "loss": 1.2657, "lr": 0.0001456321154820411, "epoch": 0.3875, "percentage": 19.38, "elapsed_time": "0:50:56", "remaining_time": "3:31:57"}
|
|
{"current_steps": 32, "total_steps": 160, "loss": 1.3068, "lr": 0.00014472135954999581, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "0:52:34", "remaining_time": "3:30:16"}
|
|
{"current_steps": 33, "total_steps": 160, "loss": 1.2839, "lr": 0.00014378565230181657, "epoch": 0.4125, "percentage": 20.62, "elapsed_time": "0:54:12", "remaining_time": "3:28:37"}
|
|
{"current_steps": 34, "total_steps": 160, "loss": 1.2868, "lr": 0.0001428253544704596, "epoch": 0.425, "percentage": 21.25, "elapsed_time": "0:55:51", "remaining_time": "3:26:58"}
|
|
{"current_steps": 35, "total_steps": 160, "loss": 1.2815, "lr": 0.00014184083626901897, "epoch": 0.4375, "percentage": 21.88, "elapsed_time": "0:57:29", "remaining_time": "3:25:20"}
|
|
{"current_steps": 36, "total_steps": 160, "loss": 1.2895, "lr": 0.0001408324772480025, "epoch": 0.45, "percentage": 22.5, "elapsed_time": "0:59:07", "remaining_time": "3:23:40"}
|
|
{"current_steps": 37, "total_steps": 160, "loss": 1.2718, "lr": 0.00013980066614900776, "epoch": 0.4625, "percentage": 23.12, "elapsed_time": "1:00:45", "remaining_time": "3:22:00"}
|
|
{"current_steps": 38, "total_steps": 160, "loss": 1.2596, "lr": 0.00013874580075485485, "epoch": 0.475, "percentage": 23.75, "elapsed_time": "1:02:24", "remaining_time": "3:20:22"}
|
|
{"current_steps": 39, "total_steps": 160, "loss": 1.2809, "lr": 0.00013766828773623352, "epoch": 0.4875, "percentage": 24.38, "elapsed_time": "1:04:03", "remaining_time": "3:18:44"}
|
|
{"current_steps": 40, "total_steps": 160, "loss": 1.2248, "lr": 0.00013656854249492382, "epoch": 0.5, "percentage": 25.0, "elapsed_time": "1:05:41", "remaining_time": "3:17:05"}
|
|
{"current_steps": 41, "total_steps": 160, "loss": 1.2653, "lr": 0.0001354469890036509, "epoch": 0.5125, "percentage": 25.62, "elapsed_time": "1:07:48", "remaining_time": "3:16:48"}
|
|
{"current_steps": 42, "total_steps": 160, "loss": 1.2687, "lr": 0.00013430405964263536, "epoch": 0.525, "percentage": 26.25, "elapsed_time": "1:09:27", "remaining_time": "3:15:07"}
|
|
{"current_steps": 43, "total_steps": 160, "loss": 1.269, "lr": 0.00013314019503290255, "epoch": 0.5375, "percentage": 26.88, "elapsed_time": "1:11:05", "remaining_time": "3:13:27"}
|
|
{"current_steps": 44, "total_steps": 160, "loss": 1.2559, "lr": 0.00013195584386641469, "epoch": 0.55, "percentage": 27.5, "elapsed_time": "1:12:44", "remaining_time": "3:11:45"}
|
|
{"current_steps": 45, "total_steps": 160, "loss": 1.2477, "lr": 0.00013075146273309164, "epoch": 0.5625, "percentage": 28.12, "elapsed_time": "1:14:22", "remaining_time": "3:10:03"}
|
|
{"current_steps": 46, "total_steps": 160, "loss": 1.2358, "lr": 0.00012952751594478675, "epoch": 0.575, "percentage": 28.75, "elapsed_time": "1:16:00", "remaining_time": "3:08:21"}
|
|
{"current_steps": 47, "total_steps": 160, "loss": 1.2444, "lr": 0.0001282844753562857, "epoch": 0.5875, "percentage": 29.38, "elapsed_time": "1:17:38", "remaining_time": "3:06:39"}
|
|
{"current_steps": 48, "total_steps": 160, "loss": 1.2535, "lr": 0.00012702282018339786, "epoch": 0.6, "percentage": 30.0, "elapsed_time": "1:19:16", "remaining_time": "3:04:58"}
|
|
{"current_steps": 49, "total_steps": 160, "loss": 1.2361, "lr": 0.00012574303681820898, "epoch": 0.6125, "percentage": 30.63, "elapsed_time": "1:20:54", "remaining_time": "3:03:17"}
|
|
{"current_steps": 50, "total_steps": 160, "loss": 1.2283, "lr": 0.0001244456186415682, "epoch": 0.625, "percentage": 31.25, "elapsed_time": "1:22:32", "remaining_time": "3:01:36"}
|
|
{"current_steps": 51, "total_steps": 160, "loss": 1.2401, "lr": 0.00012313106583288004, "epoch": 0.6375, "percentage": 31.87, "elapsed_time": "1:24:10", "remaining_time": "2:59:53"}
|
|
{"current_steps": 52, "total_steps": 160, "loss": 1.2399, "lr": 0.00012179988517727591, "epoch": 0.65, "percentage": 32.5, "elapsed_time": "1:25:47", "remaining_time": "2:58:11"}
|
|
{"current_steps": 53, "total_steps": 160, "loss": 1.2441, "lr": 0.00012045258987023879, "epoch": 0.6625, "percentage": 33.12, "elapsed_time": "1:27:25", "remaining_time": "2:56:30"}
|
|
{"current_steps": 54, "total_steps": 160, "loss": 1.253, "lr": 0.00011908969931975641, "epoch": 0.675, "percentage": 33.75, "elapsed_time": "1:29:04", "remaining_time": "2:54:50"}
|
|
{"current_steps": 55, "total_steps": 160, "loss": 1.2586, "lr": 0.00011771173894607985, "epoch": 0.6875, "percentage": 34.38, "elapsed_time": "1:30:41", "remaining_time": "2:53:09"}
|
|
{"current_steps": 56, "total_steps": 160, "loss": 1.2643, "lr": 0.00011631923997916375, "epoch": 0.7, "percentage": 35.0, "elapsed_time": "1:32:20", "remaining_time": "2:51:28"}
|
|
{"current_steps": 57, "total_steps": 160, "loss": 1.2657, "lr": 0.00011491273925386736, "epoch": 0.7125, "percentage": 35.62, "elapsed_time": "1:33:58", "remaining_time": "2:49:48"}
|
|
{"current_steps": 58, "total_steps": 160, "loss": 1.2526, "lr": 0.00011349277900299426, "epoch": 0.725, "percentage": 36.25, "elapsed_time": "1:35:36", "remaining_time": "2:48:08"}
|
|
{"current_steps": 59, "total_steps": 160, "loss": 1.2402, "lr": 0.00011205990664825127, "epoch": 0.7375, "percentage": 36.88, "elapsed_time": "1:37:13", "remaining_time": "2:46:26"}
|
|
{"current_steps": 60, "total_steps": 160, "loss": 1.2264, "lr": 0.00011061467458920719, "epoch": 0.75, "percentage": 37.5, "elapsed_time": "1:38:51", "remaining_time": "2:44:46"}
|
|
{"current_steps": 61, "total_steps": 160, "loss": 1.22, "lr": 0.00010915763999033201, "epoch": 0.7625, "percentage": 38.12, "elapsed_time": "1:40:30", "remaining_time": "2:43:06"}
|
|
{"current_steps": 62, "total_steps": 160, "loss": 1.203, "lr": 0.00010768936456619945, "epoch": 0.775, "percentage": 38.75, "elapsed_time": "1:42:08", "remaining_time": "2:41:27"}
|
|
{"current_steps": 63, "total_steps": 160, "loss": 1.2295, "lr": 0.0001062104143649355, "epoch": 0.7875, "percentage": 39.38, "elapsed_time": "1:43:47", "remaining_time": "2:39:47"}
|
|
{"current_steps": 64, "total_steps": 160, "loss": 1.1936, "lr": 0.0001047213595499958, "epoch": 0.8, "percentage": 40.0, "elapsed_time": "1:45:25", "remaining_time": "2:38:08"}
|
|
{"current_steps": 65, "total_steps": 160, "loss": 1.1927, "lr": 0.000103222774180357, "epoch": 0.8125, "percentage": 40.62, "elapsed_time": "1:47:03", "remaining_time": "2:36:27"}
|
|
{"current_steps": 66, "total_steps": 160, "loss": 1.2116, "lr": 0.00010171523598920594, "epoch": 0.825, "percentage": 41.25, "elapsed_time": "1:48:41", "remaining_time": "2:34:47"}
|
|
{"current_steps": 67, "total_steps": 160, "loss": 1.2002, "lr": 0.00010019932616121264, "epoch": 0.8375, "percentage": 41.88, "elapsed_time": "1:50:19", "remaining_time": "2:33:08"}
|
|
{"current_steps": 68, "total_steps": 160, "loss": 1.2225, "lr": 9.867562910847246e-05, "epoch": 0.85, "percentage": 42.5, "elapsed_time": "1:51:57", "remaining_time": "2:31:28"}
|
|
{"current_steps": 69, "total_steps": 160, "loss": 1.1982, "lr": 9.714473224520406e-05, "epoch": 0.8625, "percentage": 43.12, "elapsed_time": "1:53:35", "remaining_time": "2:29:48"}
|
|
{"current_steps": 70, "total_steps": 160, "loss": 1.2015, "lr": 9.560722576129029e-05, "epoch": 0.875, "percentage": 43.75, "elapsed_time": "1:55:13", "remaining_time": "2:28:08"}
|
|
{"current_steps": 71, "total_steps": 160, "loss": 1.2013, "lr": 9.406370239474839e-05, "epoch": 0.8875, "percentage": 44.38, "elapsed_time": "1:56:51", "remaining_time": "2:26:28"}
|
|
{"current_steps": 72, "total_steps": 160, "loss": 1.2101, "lr": 9.251475720321848e-05, "epoch": 0.9, "percentage": 45.0, "elapsed_time": "1:58:28", "remaining_time": "2:24:48"}
|
|
{"current_steps": 73, "total_steps": 160, "loss": 1.1889, "lr": 9.096098733455746e-05, "epoch": 0.9125, "percentage": 45.62, "elapsed_time": "2:00:06", "remaining_time": "2:23:08"}
|
|
{"current_steps": 74, "total_steps": 160, "loss": 1.1915, "lr": 8.940299179662703e-05, "epoch": 0.925, "percentage": 46.25, "elapsed_time": "2:01:43", "remaining_time": "2:21:27"}
|
|
{"current_steps": 75, "total_steps": 160, "loss": 1.2018, "lr": 8.784137122636488e-05, "epoch": 0.9375, "percentage": 46.88, "elapsed_time": "2:03:21", "remaining_time": "2:19:47"}
|
|
{"current_steps": 76, "total_steps": 160, "loss": 1.188, "lr": 8.627672765822762e-05, "epoch": 0.95, "percentage": 47.5, "elapsed_time": "2:04:58", "remaining_time": "2:18:07"}
|
|
{"current_steps": 77, "total_steps": 160, "loss": 1.1821, "lr": 8.470966429209512e-05, "epoch": 0.9625, "percentage": 48.12, "elapsed_time": "2:06:36", "remaining_time": "2:16:28"}
|
|
{"current_steps": 78, "total_steps": 160, "loss": 1.1687, "lr": 8.31407852607255e-05, "epoch": 0.975, "percentage": 48.75, "elapsed_time": "2:08:14", "remaining_time": "2:14:49"}
|
|
{"current_steps": 79, "total_steps": 160, "loss": 1.2024, "lr": 8.157069539685026e-05, "epoch": 0.9875, "percentage": 49.38, "elapsed_time": "2:09:52", "remaining_time": "2:13:10"}
|
|
{"current_steps": 80, "total_steps": 160, "loss": 1.1721, "lr": 8e-05, "epoch": 1.0, "percentage": 50.0, "elapsed_time": "2:11:30", "remaining_time": "2:11:30"}
|
|
{"current_steps": 81, "total_steps": 160, "loss": 1.2239, "lr": 7.842930460314975e-05, "epoch": 1.0125, "percentage": 50.62, "elapsed_time": "2:13:40", "remaining_time": "2:10:22"}
|
|
{"current_steps": 82, "total_steps": 160, "loss": 1.2615, "lr": 7.685921473927454e-05, "epoch": 1.025, "percentage": 51.25, "elapsed_time": "2:15:18", "remaining_time": "2:08:42"}
|
|
{"current_steps": 83, "total_steps": 160, "loss": 1.2229, "lr": 7.529033570790488e-05, "epoch": 1.0375, "percentage": 51.88, "elapsed_time": "2:16:57", "remaining_time": "2:07:03"}
|
|
{"current_steps": 84, "total_steps": 160, "loss": 1.2115, "lr": 7.372327234177242e-05, "epoch": 1.05, "percentage": 52.5, "elapsed_time": "2:18:36", "remaining_time": "2:05:24"}
|
|
{"current_steps": 85, "total_steps": 160, "loss": 1.2484, "lr": 7.215862877363515e-05, "epoch": 1.0625, "percentage": 53.12, "elapsed_time": "2:20:15", "remaining_time": "2:03:45"}
|
|
{"current_steps": 86, "total_steps": 160, "loss": 1.2583, "lr": 7.0597008203373e-05, "epoch": 1.075, "percentage": 53.75, "elapsed_time": "2:21:54", "remaining_time": "2:02:06"}
|
|
{"current_steps": 87, "total_steps": 160, "loss": 1.2448, "lr": 6.903901266544258e-05, "epoch": 1.0875, "percentage": 54.37, "elapsed_time": "2:23:32", "remaining_time": "2:00:26"}
|
|
{"current_steps": 88, "total_steps": 160, "loss": 1.2694, "lr": 6.748524279678152e-05, "epoch": 1.1, "percentage": 55.0, "elapsed_time": "2:25:11", "remaining_time": "1:58:47"}
|
|
{"current_steps": 89, "total_steps": 160, "loss": 1.2213, "lr": 6.593629760525164e-05, "epoch": 1.1125, "percentage": 55.62, "elapsed_time": "2:26:51", "remaining_time": "1:57:09"}
|
|
{"current_steps": 90, "total_steps": 160, "loss": 1.2448, "lr": 6.439277423870975e-05, "epoch": 1.125, "percentage": 56.25, "elapsed_time": "2:28:29", "remaining_time": "1:55:29"}
|
|
{"current_steps": 91, "total_steps": 160, "loss": 1.2967, "lr": 6.285526775479596e-05, "epoch": 1.1375, "percentage": 56.88, "elapsed_time": "2:30:07", "remaining_time": "1:53:50"}
|
|
{"current_steps": 92, "total_steps": 160, "loss": 1.2426, "lr": 6.13243708915276e-05, "epoch": 1.15, "percentage": 57.5, "elapsed_time": "2:31:46", "remaining_time": "1:52:10"}
|
|
{"current_steps": 93, "total_steps": 160, "loss": 1.2834, "lr": 5.9800673838787364e-05, "epoch": 1.1625, "percentage": 58.13, "elapsed_time": "2:33:24", "remaining_time": "1:50:31"}
|
|
{"current_steps": 94, "total_steps": 160, "loss": 1.2123, "lr": 5.828476401079407e-05, "epoch": 1.175, "percentage": 58.75, "elapsed_time": "2:35:03", "remaining_time": "1:48:52"}
|
|
{"current_steps": 95, "total_steps": 160, "loss": 1.2358, "lr": 5.677722581964303e-05, "epoch": 1.1875, "percentage": 59.38, "elapsed_time": "2:36:41", "remaining_time": "1:47:12"}
|
|
{"current_steps": 96, "total_steps": 160, "loss": 1.2278, "lr": 5.5278640450004216e-05, "epoch": 1.2, "percentage": 60.0, "elapsed_time": "2:38:20", "remaining_time": "1:45:33"}
|
|
{"current_steps": 97, "total_steps": 160, "loss": 1.2044, "lr": 5.3789585635064534e-05, "epoch": 1.2125, "percentage": 60.62, "elapsed_time": "2:39:59", "remaining_time": "1:43:54"}
|
|
{"current_steps": 98, "total_steps": 160, "loss": 1.1828, "lr": 5.231063543380055e-05, "epoch": 1.225, "percentage": 61.25, "elapsed_time": "2:41:38", "remaining_time": "1:42:15"}
|
|
{"current_steps": 99, "total_steps": 160, "loss": 1.2169, "lr": 5.084236000966803e-05, "epoch": 1.2375, "percentage": 61.88, "elapsed_time": "2:43:16", "remaining_time": "1:40:36"}
|
|
{"current_steps": 100, "total_steps": 160, "loss": 1.2132, "lr": 4.9385325410792824e-05, "epoch": 1.25, "percentage": 62.5, "elapsed_time": "2:44:55", "remaining_time": "1:38:57"}
|
|
{"current_steps": 101, "total_steps": 160, "loss": 1.2336, "lr": 4.794009335174874e-05, "epoch": 1.2625, "percentage": 63.12, "elapsed_time": "2:46:33", "remaining_time": "1:37:17"}
|
|
{"current_steps": 102, "total_steps": 160, "loss": 1.2196, "lr": 4.650722099700578e-05, "epoch": 1.275, "percentage": 63.75, "elapsed_time": "2:48:11", "remaining_time": "1:35:38"}
|
|
{"current_steps": 103, "total_steps": 160, "loss": 1.2204, "lr": 4.508726074613262e-05, "epoch": 1.2875, "percentage": 64.38, "elapsed_time": "2:49:50", "remaining_time": "1:33:59"}
|
|
{"current_steps": 104, "total_steps": 160, "loss": 1.2468, "lr": 4.3680760020836266e-05, "epoch": 1.3, "percentage": 65.0, "elapsed_time": "2:51:28", "remaining_time": "1:32:20"}
|
|
{"current_steps": 105, "total_steps": 160, "loss": 1.1899, "lr": 4.2288261053920186e-05, "epoch": 1.3125, "percentage": 65.62, "elapsed_time": "2:53:07", "remaining_time": "1:30:41"}
|
|
{"current_steps": 106, "total_steps": 160, "loss": 1.2373, "lr": 4.0910300680243636e-05, "epoch": 1.325, "percentage": 66.25, "elapsed_time": "2:54:46", "remaining_time": "1:29:02"}
|
|
{"current_steps": 107, "total_steps": 160, "loss": 1.1971, "lr": 3.954741012976125e-05, "epoch": 1.3375, "percentage": 66.88, "elapsed_time": "2:56:25", "remaining_time": "1:27:23"}
|
|
{"current_steps": 108, "total_steps": 160, "loss": 1.2109, "lr": 3.8200114822724096e-05, "epoch": 1.35, "percentage": 67.5, "elapsed_time": "2:58:04", "remaining_time": "1:25:44"}
|
|
{"current_steps": 109, "total_steps": 160, "loss": 1.1777, "lr": 3.686893416711998e-05, "epoch": 1.3625, "percentage": 68.12, "elapsed_time": "2:59:42", "remaining_time": "1:24:05"}
|
|
{"current_steps": 110, "total_steps": 160, "loss": 1.2271, "lr": 3.5554381358431845e-05, "epoch": 1.375, "percentage": 68.75, "elapsed_time": "3:01:20", "remaining_time": "1:22:25"}
|
|
{"current_steps": 111, "total_steps": 160, "loss": 1.1753, "lr": 3.425696318179103e-05, "epoch": 1.3875, "percentage": 69.38, "elapsed_time": "3:02:58", "remaining_time": "1:20:46"}
|
|
{"current_steps": 112, "total_steps": 160, "loss": 1.216, "lr": 3.297717981660216e-05, "epoch": 1.4, "percentage": 70.0, "elapsed_time": "3:04:36", "remaining_time": "1:19:07"}
|
|
{"current_steps": 113, "total_steps": 160, "loss": 1.1956, "lr": 3.1715524643714286e-05, "epoch": 1.4125, "percentage": 70.62, "elapsed_time": "3:06:15", "remaining_time": "1:17:28"}
|
|
{"current_steps": 114, "total_steps": 160, "loss": 1.2017, "lr": 3.0472484055213276e-05, "epoch": 1.425, "percentage": 71.25, "elapsed_time": "3:07:53", "remaining_time": "1:15:49"}
|
|
{"current_steps": 115, "total_steps": 160, "loss": 1.1977, "lr": 2.9248537266908373e-05, "epoch": 1.4375, "percentage": 71.88, "elapsed_time": "3:09:32", "remaining_time": "1:14:10"}
|
|
{"current_steps": 116, "total_steps": 160, "loss": 1.2068, "lr": 2.804415613358532e-05, "epoch": 1.45, "percentage": 72.5, "elapsed_time": "3:11:10", "remaining_time": "1:12:30"}
|
|
{"current_steps": 117, "total_steps": 160, "loss": 1.1919, "lr": 2.685980496709749e-05, "epoch": 1.4625, "percentage": 73.12, "elapsed_time": "3:12:49", "remaining_time": "1:10:51"}
|
|
{"current_steps": 118, "total_steps": 160, "loss": 1.1824, "lr": 2.569594035736466e-05, "epoch": 1.475, "percentage": 73.75, "elapsed_time": "3:14:28", "remaining_time": "1:09:13"}
|
|
{"current_steps": 119, "total_steps": 160, "loss": 1.2038, "lr": 2.4553010996349143e-05, "epoch": 1.4875, "percentage": 74.38, "elapsed_time": "3:16:06", "remaining_time": "1:07:34"}
|
|
{"current_steps": 120, "total_steps": 160, "loss": 1.1529, "lr": 2.3431457505076205e-05, "epoch": 1.5, "percentage": 75.0, "elapsed_time": "3:17:45", "remaining_time": "1:05:55"}
|
|
{"current_steps": 121, "total_steps": 160, "loss": 1.192, "lr": 2.2331712263766495e-05, "epoch": 1.5125, "percentage": 75.62, "elapsed_time": "3:19:54", "remaining_time": "1:04:25"}
|
|
{"current_steps": 122, "total_steps": 160, "loss": 1.1969, "lr": 2.1254199245145177e-05, "epoch": 1.525, "percentage": 76.25, "elapsed_time": "3:21:33", "remaining_time": "1:02:46"}
|
|
{"current_steps": 123, "total_steps": 160, "loss": 1.1987, "lr": 2.0199333850992245e-05, "epoch": 1.5375, "percentage": 76.88, "elapsed_time": "3:23:11", "remaining_time": "1:01:07"}
|
|
{"current_steps": 124, "total_steps": 160, "loss": 1.1871, "lr": 1.9167522751997527e-05, "epoch": 1.55, "percentage": 77.5, "elapsed_time": "3:24:49", "remaining_time": "0:59:28"}
|
|
{"current_steps": 125, "total_steps": 160, "loss": 1.1808, "lr": 1.815916373098104e-05, "epoch": 1.5625, "percentage": 78.12, "elapsed_time": "3:26:28", "remaining_time": "0:57:48"}
|
|
{"current_steps": 126, "total_steps": 160, "loss": 1.1695, "lr": 1.7174645529540424e-05, "epoch": 1.575, "percentage": 78.75, "elapsed_time": "3:28:06", "remaining_time": "0:56:09"}
|
|
{"current_steps": 127, "total_steps": 160, "loss": 1.1789, "lr": 1.621434769818344e-05, "epoch": 1.5875, "percentage": 79.38, "elapsed_time": "3:29:44", "remaining_time": "0:54:29"}
|
|
{"current_steps": 128, "total_steps": 160, "loss": 1.2016, "lr": 1.5278640450004213e-05, "epoch": 1.6, "percentage": 80.0, "elapsed_time": "3:31:22", "remaining_time": "0:52:50"}
|
|
{"current_steps": 129, "total_steps": 160, "loss": 1.1712, "lr": 1.4367884517958914e-05, "epoch": 1.6125, "percentage": 80.62, "elapsed_time": "3:33:00", "remaining_time": "0:51:11"}
|
|
{"current_steps": 130, "total_steps": 160, "loss": 1.1647, "lr": 1.3482431015796373e-05, "epoch": 1.625, "percentage": 81.25, "elapsed_time": "3:34:38", "remaining_time": "0:49:32"}
|
|
{"current_steps": 131, "total_steps": 160, "loss": 1.1781, "lr": 1.2622621302697087e-05, "epoch": 1.6375, "percentage": 81.88, "elapsed_time": "3:36:16", "remaining_time": "0:47:52"}
|
|
{"current_steps": 132, "total_steps": 160, "loss": 1.1777, "lr": 1.1788786851672628e-05, "epoch": 1.65, "percentage": 82.5, "elapsed_time": "3:37:54", "remaining_time": "0:46:13"}
|
|
{"current_steps": 133, "total_steps": 160, "loss": 1.1838, "lr": 1.0981249121776654e-05, "epoch": 1.6625, "percentage": 83.12, "elapsed_time": "3:39:32", "remaining_time": "0:44:34"}
|
|
{"current_steps": 134, "total_steps": 160, "loss": 1.1926, "lr": 1.0200319434176227e-05, "epoch": 1.675, "percentage": 83.75, "elapsed_time": "3:41:10", "remaining_time": "0:42:54"}
|
|
{"current_steps": 135, "total_steps": 160, "loss": 1.185, "lr": 9.446298852131605e-06, "epoch": 1.6875, "percentage": 84.38, "elapsed_time": "3:42:48", "remaining_time": "0:41:15"}
|
|
{"current_steps": 136, "total_steps": 160, "loss": 1.1891, "lr": 8.719478064930578e-06, "epoch": 1.7, "percentage": 85.0, "elapsed_time": "3:44:26", "remaining_time": "0:39:36"}
|
|
{"current_steps": 137, "total_steps": 160, "loss": 1.1973, "lr": 8.020137275822297e-06, "epoch": 1.7125, "percentage": 85.62, "elapsed_time": "3:46:05", "remaining_time": "0:37:57"}
|
|
{"current_steps": 138, "total_steps": 160, "loss": 1.1824, "lr": 7.348546093993492e-06, "epoch": 1.725, "percentage": 86.25, "elapsed_time": "3:47:43", "remaining_time": "0:36:18"}
|
|
{"current_steps": 139, "total_steps": 160, "loss": 1.1724, "lr": 6.704963430629132e-06, "epoch": 1.7375, "percentage": 86.88, "elapsed_time": "3:49:20", "remaining_time": "0:34:38"}
|
|
{"current_steps": 140, "total_steps": 160, "loss": 1.1647, "lr": 6.0896373990970614e-06, "epoch": 1.75, "percentage": 87.5, "elapsed_time": "3:50:58", "remaining_time": "0:32:59"}
|
|
{"current_steps": 141, "total_steps": 160, "loss": 1.1553, "lr": 5.502805219295715e-06, "epoch": 1.7625, "percentage": 88.12, "elapsed_time": "3:52:37", "remaining_time": "0:31:20"}
|
|
{"current_steps": 142, "total_steps": 160, "loss": 1.1432, "lr": 4.944693126201276e-06, "epoch": 1.775, "percentage": 88.75, "elapsed_time": "3:54:15", "remaining_time": "0:29:41"}
|
|
{"current_steps": 143, "total_steps": 160, "loss": 1.1704, "lr": 4.415516282649756e-06, "epoch": 1.7875, "percentage": 89.38, "elapsed_time": "3:55:53", "remaining_time": "0:28:02"}
|
|
{"current_steps": 144, "total_steps": 160, "loss": 1.1378, "lr": 3.915478696387718e-06, "epoch": 1.8, "percentage": 90.0, "elapsed_time": "3:57:32", "remaining_time": "0:26:23"}
|
|
{"current_steps": 145, "total_steps": 160, "loss": 1.1372, "lr": 3.4447731414232945e-06, "epoch": 1.8125, "percentage": 90.62, "elapsed_time": "3:59:10", "remaining_time": "0:24:44"}
|
|
{"current_steps": 146, "total_steps": 160, "loss": 1.1577, "lr": 3.0035810837082267e-06, "epoch": 1.825, "percentage": 91.25, "elapsed_time": "4:00:47", "remaining_time": "0:23:05"}
|
|
{"current_steps": 147, "total_steps": 160, "loss": 1.1482, "lr": 2.5920726111792195e-06, "epoch": 1.8375, "percentage": 91.88, "elapsed_time": "4:02:26", "remaining_time": "0:21:26"}
|
|
{"current_steps": 148, "total_steps": 160, "loss": 1.1699, "lr": 2.2104063681858757e-06, "epoch": 1.85, "percentage": 92.5, "elapsed_time": "4:04:04", "remaining_time": "0:19:47"}
|
|
{"current_steps": 149, "total_steps": 160, "loss": 1.1475, "lr": 1.8587294943302092e-06, "epoch": 1.8625, "percentage": 93.12, "elapsed_time": "4:05:42", "remaining_time": "0:18:08"}
|
|
{"current_steps": 150, "total_steps": 160, "loss": 1.1529, "lr": 1.5371775677415656e-06, "epoch": 1.875, "percentage": 93.75, "elapsed_time": "4:07:20", "remaining_time": "0:16:29"}
|
|
{"current_steps": 151, "total_steps": 160, "loss": 1.1544, "lr": 1.2458745528086723e-06, "epoch": 1.8875, "percentage": 94.38, "elapsed_time": "4:08:57", "remaining_time": "0:14:50"}
|
|
{"current_steps": 152, "total_steps": 160, "loss": 1.1637, "lr": 9.849327523889873e-07, "epoch": 1.9, "percentage": 95.0, "elapsed_time": "4:10:35", "remaining_time": "0:13:11"}
|
|
{"current_steps": 153, "total_steps": 160, "loss": 1.1429, "lr": 7.5445276451382e-07, "epoch": 1.9125, "percentage": 95.62, "elapsed_time": "4:12:13", "remaining_time": "0:11:32"}
|
|
{"current_steps": 154, "total_steps": 160, "loss": 1.1471, "lr": 5.545234436058966e-07, "epoch": 1.925, "percentage": 96.25, "elapsed_time": "4:13:50", "remaining_time": "0:09:53"}
|
|
{"current_steps": 155, "total_steps": 160, "loss": 1.1584, "lr": 3.852218662242546e-07, "epoch": 1.9375, "percentage": 96.88, "elapsed_time": "4:15:27", "remaining_time": "0:08:14"}
|
|
{"current_steps": 156, "total_steps": 160, "loss": 1.1464, "lr": 2.466133013497629e-07, "epoch": 1.95, "percentage": 97.5, "elapsed_time": "4:17:05", "remaining_time": "0:06:35"}
|
|
{"current_steps": 157, "total_steps": 160, "loss": 1.1413, "lr": 1.3875118522273412e-07, "epoch": 1.9625, "percentage": 98.12, "elapsed_time": "4:18:43", "remaining_time": "0:04:56"}
|
|
{"current_steps": 158, "total_steps": 160, "loss": 1.1291, "lr": 6.167710074216792e-08, "epoch": 1.975, "percentage": 98.75, "elapsed_time": "4:20:21", "remaining_time": "0:03:17"}
|
|
{"current_steps": 159, "total_steps": 160, "loss": 1.1628, "lr": 1.5420761434814523e-08, "epoch": 1.9875, "percentage": 99.38, "elapsed_time": "4:21:59", "remaining_time": "0:01:38"}
|
|
{"current_steps": 160, "total_steps": 160, "loss": 1.1336, "lr": 0.0, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "4:23:37", "remaining_time": "0:00:00"}
|
|
{"current_steps": 160, "total_steps": 160, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "4:24:08", "remaining_time": "0:00:00"}
|