Model: huseyinatahaninan/appworld_distillation_sft_v2-SFT-Qwen3-8B Source: Original Platform
77 lines
13 KiB
JSON
77 lines
13 KiB
JSON
{"current_steps": 1, "total_steps": 50, "loss": 1.2369, "lr": 0.0, "epoch": 0.5714285714285714, "percentage": 2.0, "elapsed_time": "0:00:41", "remaining_time": "0:33:58"}
|
|
{"current_steps": 2, "total_steps": 50, "loss": 1.1697, "lr": 1.0000000000000002e-06, "epoch": 1.0, "percentage": 4.0, "elapsed_time": "0:01:08", "remaining_time": "0:27:23"}
|
|
{"current_steps": 2, "total_steps": 50, "eval_loss": 1.2943594455718994, "epoch": 1.0, "percentage": 4.0, "elapsed_time": "0:01:22", "remaining_time": "0:32:59"}
|
|
{"current_steps": 3, "total_steps": 50, "loss": 1.2156, "lr": 2.0000000000000003e-06, "epoch": 1.5714285714285714, "percentage": 6.0, "elapsed_time": "0:01:58", "remaining_time": "0:30:51"}
|
|
{"current_steps": 4, "total_steps": 50, "loss": 1.0781, "lr": 3e-06, "epoch": 2.0, "percentage": 8.0, "elapsed_time": "0:02:24", "remaining_time": "0:27:43"}
|
|
{"current_steps": 4, "total_steps": 50, "eval_loss": 1.1406848430633545, "epoch": 2.0, "percentage": 8.0, "elapsed_time": "0:02:36", "remaining_time": "0:30:02"}
|
|
{"current_steps": 5, "total_steps": 50, "loss": 0.9982, "lr": 4.000000000000001e-06, "epoch": 2.571428571428571, "percentage": 10.0, "elapsed_time": "0:03:11", "remaining_time": "0:28:44"}
|
|
{"current_steps": 6, "total_steps": 50, "loss": 0.9806, "lr": 5e-06, "epoch": 3.0, "percentage": 12.0, "elapsed_time": "0:03:37", "remaining_time": "0:26:35"}
|
|
{"current_steps": 6, "total_steps": 50, "eval_loss": 1.0041135549545288, "epoch": 3.0, "percentage": 12.0, "elapsed_time": "0:03:49", "remaining_time": "0:28:03"}
|
|
{"current_steps": 7, "total_steps": 50, "loss": 0.9273, "lr": 4.993910125649561e-06, "epoch": 3.571428571428571, "percentage": 14.0, "elapsed_time": "0:04:25", "remaining_time": "0:27:10"}
|
|
{"current_steps": 8, "total_steps": 50, "loss": 0.9093, "lr": 4.975670171853926e-06, "epoch": 4.0, "percentage": 16.0, "elapsed_time": "0:04:50", "remaining_time": "0:25:26"}
|
|
{"current_steps": 8, "total_steps": 50, "eval_loss": 0.9050876498222351, "epoch": 4.0, "percentage": 16.0, "elapsed_time": "0:05:02", "remaining_time": "0:26:29"}
|
|
{"current_steps": 9, "total_steps": 50, "loss": 0.86, "lr": 4.9453690018345144e-06, "epoch": 4.571428571428571, "percentage": 18.0, "elapsed_time": "0:05:38", "remaining_time": "0:25:41"}
|
|
{"current_steps": 10, "total_steps": 50, "loss": 0.8595, "lr": 4.903154239845798e-06, "epoch": 5.0, "percentage": 20.0, "elapsed_time": "0:06:02", "remaining_time": "0:24:09"}
|
|
{"current_steps": 10, "total_steps": 50, "eval_loss": 0.8866418600082397, "epoch": 5.0, "percentage": 20.0, "elapsed_time": "0:06:14", "remaining_time": "0:24:58"}
|
|
{"current_steps": 11, "total_steps": 50, "loss": 0.7986, "lr": 4.849231551964771e-06, "epoch": 5.571428571428571, "percentage": 22.0, "elapsed_time": "0:06:49", "remaining_time": "0:24:11"}
|
|
{"current_steps": 12, "total_steps": 50, "loss": 0.7688, "lr": 4.783863644106502e-06, "epoch": 6.0, "percentage": 24.0, "elapsed_time": "0:07:16", "remaining_time": "0:23:02"}
|
|
{"current_steps": 12, "total_steps": 50, "eval_loss": 0.8012941479682922, "epoch": 6.0, "percentage": 24.0, "elapsed_time": "0:07:28", "remaining_time": "0:23:40"}
|
|
{"current_steps": 13, "total_steps": 50, "loss": 0.7405, "lr": 4.707368982147318e-06, "epoch": 6.571428571428571, "percentage": 26.0, "elapsed_time": "0:08:04", "remaining_time": "0:22:59"}
|
|
{"current_steps": 14, "total_steps": 50, "loss": 0.7223, "lr": 4.620120240391065e-06, "epoch": 7.0, "percentage": 28.0, "elapsed_time": "0:08:29", "remaining_time": "0:21:50"}
|
|
{"current_steps": 14, "total_steps": 50, "eval_loss": 0.7613986730575562, "epoch": 7.0, "percentage": 28.0, "elapsed_time": "0:08:41", "remaining_time": "0:22:21"}
|
|
{"current_steps": 15, "total_steps": 50, "loss": 0.7031, "lr": 4.522542485937369e-06, "epoch": 7.571428571428571, "percentage": 30.0, "elapsed_time": "0:09:17", "remaining_time": "0:21:40"}
|
|
{"current_steps": 16, "total_steps": 50, "loss": 0.689, "lr": 4.415111107797445e-06, "epoch": 8.0, "percentage": 32.0, "elapsed_time": "0:09:43", "remaining_time": "0:20:40"}
|
|
{"current_steps": 16, "total_steps": 50, "eval_loss": 0.727152407169342, "epoch": 8.0, "percentage": 32.0, "elapsed_time": "0:09:55", "remaining_time": "0:21:06"}
|
|
{"current_steps": 17, "total_steps": 50, "loss": 0.6511, "lr": 4.2983495008466285e-06, "epoch": 8.571428571428571, "percentage": 34.0, "elapsed_time": "0:10:30", "remaining_time": "0:20:23"}
|
|
{"current_steps": 18, "total_steps": 50, "loss": 0.6641, "lr": 4.172826515897146e-06, "epoch": 9.0, "percentage": 36.0, "elapsed_time": "0:10:56", "remaining_time": "0:19:26"}
|
|
{"current_steps": 18, "total_steps": 50, "eval_loss": 0.7126601934432983, "epoch": 9.0, "percentage": 36.0, "elapsed_time": "0:11:08", "remaining_time": "0:19:48"}
|
|
{"current_steps": 19, "total_steps": 50, "loss": 0.6349, "lr": 4.039153688314146e-06, "epoch": 9.571428571428571, "percentage": 38.0, "elapsed_time": "0:11:43", "remaining_time": "0:19:07"}
|
|
{"current_steps": 20, "total_steps": 50, "loss": 0.5795, "lr": 3.897982258676867e-06, "epoch": 10.0, "percentage": 40.0, "elapsed_time": "0:12:09", "remaining_time": "0:18:14"}
|
|
{"current_steps": 20, "total_steps": 50, "eval_loss": 0.6720197796821594, "epoch": 10.0, "percentage": 40.0, "elapsed_time": "0:12:21", "remaining_time": "0:18:32"}
|
|
{"current_steps": 21, "total_steps": 50, "loss": 0.5678, "lr": 3.7500000000000005e-06, "epoch": 10.571428571428571, "percentage": 42.0, "elapsed_time": "0:12:57", "remaining_time": "0:17:53"}
|
|
{"current_steps": 22, "total_steps": 50, "loss": 0.5451, "lr": 3.595927866972694e-06, "epoch": 11.0, "percentage": 44.0, "elapsed_time": "0:13:24", "remaining_time": "0:17:03"}
|
|
{"current_steps": 22, "total_steps": 50, "eval_loss": 0.655051589012146, "epoch": 11.0, "percentage": 44.0, "elapsed_time": "0:13:36", "remaining_time": "0:17:18"}
|
|
{"current_steps": 23, "total_steps": 50, "loss": 0.5435, "lr": 3.436516483539781e-06, "epoch": 11.571428571428571, "percentage": 46.0, "elapsed_time": "0:14:11", "remaining_time": "0:16:40"}
|
|
{"current_steps": 24, "total_steps": 50, "loss": 0.5059, "lr": 3.272542485937369e-06, "epoch": 12.0, "percentage": 48.0, "elapsed_time": "0:14:37", "remaining_time": "0:15:50"}
|
|
{"current_steps": 24, "total_steps": 50, "eval_loss": 0.6408958435058594, "epoch": 12.0, "percentage": 48.0, "elapsed_time": "0:14:49", "remaining_time": "0:16:03"}
|
|
{"current_steps": 25, "total_steps": 50, "loss": 0.5038, "lr": 3.1048047389991693e-06, "epoch": 12.571428571428571, "percentage": 50.0, "elapsed_time": "0:15:23", "remaining_time": "0:15:23"}
|
|
{"current_steps": 26, "total_steps": 50, "loss": 0.5035, "lr": 2.9341204441673267e-06, "epoch": 13.0, "percentage": 52.0, "elapsed_time": "0:15:50", "remaining_time": "0:14:37"}
|
|
{"current_steps": 26, "total_steps": 50, "eval_loss": 0.6351635456085205, "epoch": 13.0, "percentage": 52.0, "elapsed_time": "0:16:02", "remaining_time": "0:14:48"}
|
|
{"current_steps": 27, "total_steps": 50, "loss": 0.489, "lr": 2.761321158169134e-06, "epoch": 13.571428571428571, "percentage": 54.0, "elapsed_time": "0:16:38", "remaining_time": "0:14:10"}
|
|
{"current_steps": 28, "total_steps": 50, "loss": 0.484, "lr": 2.587248741756253e-06, "epoch": 14.0, "percentage": 56.0, "elapsed_time": "0:17:04", "remaining_time": "0:13:24"}
|
|
{"current_steps": 28, "total_steps": 50, "eval_loss": 0.6280523538589478, "epoch": 14.0, "percentage": 56.0, "elapsed_time": "0:17:16", "remaining_time": "0:13:34"}
|
|
{"current_steps": 29, "total_steps": 50, "loss": 0.4683, "lr": 2.4127512582437486e-06, "epoch": 14.571428571428571, "percentage": 58.0, "elapsed_time": "0:17:52", "remaining_time": "0:12:56"}
|
|
{"current_steps": 30, "total_steps": 50, "loss": 0.4436, "lr": 2.238678841830867e-06, "epoch": 15.0, "percentage": 60.0, "elapsed_time": "0:18:18", "remaining_time": "0:12:12"}
|
|
{"current_steps": 30, "total_steps": 50, "eval_loss": 0.6252209544181824, "epoch": 15.0, "percentage": 60.0, "elapsed_time": "0:18:30", "remaining_time": "0:12:20"}
|
|
{"current_steps": 31, "total_steps": 50, "loss": 0.4466, "lr": 2.0658795558326745e-06, "epoch": 15.571428571428571, "percentage": 62.0, "elapsed_time": "0:19:05", "remaining_time": "0:11:42"}
|
|
{"current_steps": 32, "total_steps": 50, "loss": 0.4347, "lr": 1.895195261000831e-06, "epoch": 16.0, "percentage": 64.0, "elapsed_time": "0:19:32", "remaining_time": "0:10:59"}
|
|
{"current_steps": 32, "total_steps": 50, "eval_loss": 0.6249921321868896, "epoch": 16.0, "percentage": 64.0, "elapsed_time": "0:19:44", "remaining_time": "0:11:06"}
|
|
{"current_steps": 33, "total_steps": 50, "loss": 0.4275, "lr": 1.7274575140626318e-06, "epoch": 16.571428571428573, "percentage": 66.0, "elapsed_time": "0:20:19", "remaining_time": "0:10:28"}
|
|
{"current_steps": 34, "total_steps": 50, "loss": 0.4139, "lr": 1.56348351646022e-06, "epoch": 17.0, "percentage": 68.0, "elapsed_time": "0:20:45", "remaining_time": "0:09:45"}
|
|
{"current_steps": 34, "total_steps": 50, "eval_loss": 0.6253374218940735, "epoch": 17.0, "percentage": 68.0, "elapsed_time": "0:20:57", "remaining_time": "0:09:51"}
|
|
{"current_steps": 35, "total_steps": 50, "loss": 0.4033, "lr": 1.4040721330273063e-06, "epoch": 17.571428571428573, "percentage": 70.0, "elapsed_time": "0:21:33", "remaining_time": "0:09:14"}
|
|
{"current_steps": 36, "total_steps": 50, "loss": 0.4108, "lr": 1.2500000000000007e-06, "epoch": 18.0, "percentage": 72.0, "elapsed_time": "0:21:58", "remaining_time": "0:08:32"}
|
|
{"current_steps": 36, "total_steps": 50, "eval_loss": 0.6265431642532349, "epoch": 18.0, "percentage": 72.0, "elapsed_time": "0:22:11", "remaining_time": "0:08:37"}
|
|
{"current_steps": 37, "total_steps": 50, "loss": 0.3948, "lr": 1.1020177413231334e-06, "epoch": 18.571428571428573, "percentage": 74.0, "elapsed_time": "0:22:45", "remaining_time": "0:07:59"}
|
|
{"current_steps": 38, "total_steps": 50, "loss": 0.3969, "lr": 9.608463116858544e-07, "epoch": 19.0, "percentage": 76.0, "elapsed_time": "0:23:12", "remaining_time": "0:07:19"}
|
|
{"current_steps": 38, "total_steps": 50, "eval_loss": 0.6287420392036438, "epoch": 19.0, "percentage": 76.0, "elapsed_time": "0:23:24", "remaining_time": "0:07:23"}
|
|
{"current_steps": 39, "total_steps": 50, "loss": 0.3965, "lr": 8.271734841028553e-07, "epoch": 19.571428571428573, "percentage": 78.0, "elapsed_time": "0:23:59", "remaining_time": "0:06:45"}
|
|
{"current_steps": 40, "total_steps": 50, "loss": 0.3825, "lr": 7.016504991533727e-07, "epoch": 20.0, "percentage": 80.0, "elapsed_time": "0:24:25", "remaining_time": "0:06:06"}
|
|
{"current_steps": 40, "total_steps": 50, "eval_loss": 0.6303004026412964, "epoch": 20.0, "percentage": 80.0, "elapsed_time": "0:24:37", "remaining_time": "0:06:09"}
|
|
{"current_steps": 41, "total_steps": 50, "loss": 0.3825, "lr": 5.848888922025553e-07, "epoch": 20.571428571428573, "percentage": 82.0, "elapsed_time": "0:25:14", "remaining_time": "0:05:32"}
|
|
{"current_steps": 42, "total_steps": 50, "loss": 0.3839, "lr": 4.774575140626317e-07, "epoch": 21.0, "percentage": 84.0, "elapsed_time": "0:25:39", "remaining_time": "0:04:53"}
|
|
{"current_steps": 42, "total_steps": 50, "eval_loss": 0.6313385367393494, "epoch": 21.0, "percentage": 84.0, "elapsed_time": "0:25:51", "remaining_time": "0:04:55"}
|
|
{"current_steps": 43, "total_steps": 50, "loss": 0.3821, "lr": 3.798797596089351e-07, "epoch": 21.571428571428573, "percentage": 86.0, "elapsed_time": "0:26:25", "remaining_time": "0:04:18"}
|
|
{"current_steps": 44, "total_steps": 50, "loss": 0.3699, "lr": 2.9263101785268253e-07, "epoch": 22.0, "percentage": 88.0, "elapsed_time": "0:26:51", "remaining_time": "0:03:39"}
|
|
{"current_steps": 44, "total_steps": 50, "eval_loss": 0.6325893998146057, "epoch": 22.0, "percentage": 88.0, "elapsed_time": "0:27:03", "remaining_time": "0:03:41"}
|
|
{"current_steps": 45, "total_steps": 50, "loss": 0.3652, "lr": 2.1613635589349756e-07, "epoch": 22.571428571428573, "percentage": 90.0, "elapsed_time": "0:27:39", "remaining_time": "0:03:04"}
|
|
{"current_steps": 46, "total_steps": 50, "loss": 0.3871, "lr": 1.507684480352292e-07, "epoch": 23.0, "percentage": 92.0, "elapsed_time": "0:28:05", "remaining_time": "0:02:26"}
|
|
{"current_steps": 46, "total_steps": 50, "eval_loss": 0.6336179971694946, "epoch": 23.0, "percentage": 92.0, "elapsed_time": "0:28:17", "remaining_time": "0:02:27"}
|
|
{"current_steps": 47, "total_steps": 50, "loss": 0.3612, "lr": 9.684576015420277e-08, "epoch": 23.571428571428573, "percentage": 94.0, "elapsed_time": "0:28:52", "remaining_time": "0:01:50"}
|
|
{"current_steps": 48, "total_steps": 50, "loss": 0.382, "lr": 5.463099816548578e-08, "epoch": 24.0, "percentage": 96.0, "elapsed_time": "0:29:19", "remaining_time": "0:01:13"}
|
|
{"current_steps": 48, "total_steps": 50, "eval_loss": 0.6337578892707825, "epoch": 24.0, "percentage": 96.0, "elapsed_time": "0:29:31", "remaining_time": "0:01:13"}
|
|
{"current_steps": 49, "total_steps": 50, "loss": 0.3611, "lr": 2.4329828146074096e-08, "epoch": 24.571428571428573, "percentage": 98.0, "elapsed_time": "0:30:07", "remaining_time": "0:00:36"}
|
|
{"current_steps": 50, "total_steps": 50, "loss": 0.3879, "lr": 6.089874350439507e-09, "epoch": 25.0, "percentage": 100.0, "elapsed_time": "0:30:33", "remaining_time": "0:00:00"}
|
|
{"current_steps": 50, "total_steps": 50, "eval_loss": 0.6342211961746216, "epoch": 25.0, "percentage": 100.0, "elapsed_time": "0:31:34", "remaining_time": "0:00:00"}
|
|
{"current_steps": 50, "total_steps": 50, "epoch": 25.0, "percentage": 100.0, "elapsed_time": "0:31:34", "remaining_time": "0:00:00"}
|