Model: huseyinatahaninan/appworld_distillation_sft-SFT-Qwen3-4B-Instruct-2507 Source: Original Platform
32 lines
5.1 KiB
JSON
32 lines
5.1 KiB
JSON
{"current_steps": 1, "total_steps": 20, "loss": 0.8433, "lr": 0.0, "epoch": 0.5, "percentage": 5.0, "elapsed_time": "0:00:23", "remaining_time": "0:07:26"}
|
|
{"current_steps": 2, "total_steps": 20, "loss": 0.9102, "lr": 2.5e-06, "epoch": 1.0, "percentage": 10.0, "elapsed_time": "0:00:45", "remaining_time": "0:06:48"}
|
|
{"current_steps": 2, "total_steps": 20, "eval_loss": 0.8433753848075867, "epoch": 1.0, "percentage": 10.0, "elapsed_time": "0:00:54", "remaining_time": "0:08:09"}
|
|
{"current_steps": 3, "total_steps": 20, "loss": 0.8534, "lr": 5e-06, "epoch": 1.5, "percentage": 15.0, "elapsed_time": "0:01:16", "remaining_time": "0:07:13"}
|
|
{"current_steps": 4, "total_steps": 20, "loss": 0.6723, "lr": 4.962019382530521e-06, "epoch": 2.0, "percentage": 20.0, "elapsed_time": "0:01:38", "remaining_time": "0:06:34"}
|
|
{"current_steps": 4, "total_steps": 20, "eval_loss": 0.4704136848449707, "epoch": 2.0, "percentage": 20.0, "elapsed_time": "0:01:47", "remaining_time": "0:07:08"}
|
|
{"current_steps": 5, "total_steps": 20, "loss": 0.4748, "lr": 4.849231551964771e-06, "epoch": 2.5, "percentage": 25.0, "elapsed_time": "0:02:13", "remaining_time": "0:06:39"}
|
|
{"current_steps": 6, "total_steps": 20, "loss": 0.3556, "lr": 4.665063509461098e-06, "epoch": 3.0, "percentage": 30.0, "elapsed_time": "0:02:34", "remaining_time": "0:05:59"}
|
|
{"current_steps": 6, "total_steps": 20, "eval_loss": 0.3564150631427765, "epoch": 3.0, "percentage": 30.0, "elapsed_time": "0:02:42", "remaining_time": "0:06:19"}
|
|
{"current_steps": 7, "total_steps": 20, "loss": 0.3381, "lr": 4.415111107797445e-06, "epoch": 3.5, "percentage": 35.0, "elapsed_time": "0:03:06", "remaining_time": "0:05:45"}
|
|
{"current_steps": 8, "total_steps": 20, "loss": 0.3261, "lr": 4.106969024216348e-06, "epoch": 4.0, "percentage": 40.0, "elapsed_time": "0:03:28", "remaining_time": "0:05:12"}
|
|
{"current_steps": 8, "total_steps": 20, "eval_loss": 0.32391461730003357, "epoch": 4.0, "percentage": 40.0, "elapsed_time": "0:03:36", "remaining_time": "0:05:25"}
|
|
{"current_steps": 9, "total_steps": 20, "loss": 0.3077, "lr": 3.7500000000000005e-06, "epoch": 4.5, "percentage": 45.0, "elapsed_time": "0:03:59", "remaining_time": "0:04:52"}
|
|
{"current_steps": 10, "total_steps": 20, "loss": 0.2697, "lr": 3.3550503583141726e-06, "epoch": 5.0, "percentage": 50.0, "elapsed_time": "0:04:22", "remaining_time": "0:04:22"}
|
|
{"current_steps": 10, "total_steps": 20, "eval_loss": 0.29709815979003906, "epoch": 5.0, "percentage": 50.0, "elapsed_time": "0:04:30", "remaining_time": "0:04:30"}
|
|
{"current_steps": 11, "total_steps": 20, "loss": 0.2657, "lr": 2.9341204441673267e-06, "epoch": 5.5, "percentage": 55.0, "elapsed_time": "0:04:58", "remaining_time": "0:04:04"}
|
|
{"current_steps": 12, "total_steps": 20, "loss": 0.2508, "lr": 2.5e-06, "epoch": 6.0, "percentage": 60.0, "elapsed_time": "0:05:21", "remaining_time": "0:03:34"}
|
|
{"current_steps": 12, "total_steps": 20, "eval_loss": 0.27973881363868713, "epoch": 6.0, "percentage": 60.0, "elapsed_time": "0:05:29", "remaining_time": "0:03:39"}
|
|
{"current_steps": 13, "total_steps": 20, "loss": 0.2478, "lr": 2.0658795558326745e-06, "epoch": 6.5, "percentage": 65.0, "elapsed_time": "0:05:55", "remaining_time": "0:03:11"}
|
|
{"current_steps": 14, "total_steps": 20, "loss": 0.225, "lr": 1.6449496416858285e-06, "epoch": 7.0, "percentage": 70.0, "elapsed_time": "0:06:19", "remaining_time": "0:02:42"}
|
|
{"current_steps": 14, "total_steps": 20, "eval_loss": 0.2676139175891876, "epoch": 7.0, "percentage": 70.0, "elapsed_time": "0:06:28", "remaining_time": "0:02:46"}
|
|
{"current_steps": 15, "total_steps": 20, "loss": 0.2245, "lr": 1.2500000000000007e-06, "epoch": 7.5, "percentage": 75.0, "elapsed_time": "0:06:52", "remaining_time": "0:02:17"}
|
|
{"current_steps": 16, "total_steps": 20, "loss": 0.2327, "lr": 8.930309757836517e-07, "epoch": 8.0, "percentage": 80.0, "elapsed_time": "0:07:15", "remaining_time": "0:01:48"}
|
|
{"current_steps": 16, "total_steps": 20, "eval_loss": 0.2616689205169678, "epoch": 8.0, "percentage": 80.0, "elapsed_time": "0:07:23", "remaining_time": "0:01:50"}
|
|
{"current_steps": 17, "total_steps": 20, "loss": 0.2284, "lr": 5.848888922025553e-07, "epoch": 8.5, "percentage": 85.0, "elapsed_time": "0:07:47", "remaining_time": "0:01:22"}
|
|
{"current_steps": 18, "total_steps": 20, "loss": 0.2064, "lr": 3.3493649053890325e-07, "epoch": 9.0, "percentage": 90.0, "elapsed_time": "0:08:09", "remaining_time": "0:00:54"}
|
|
{"current_steps": 18, "total_steps": 20, "eval_loss": 0.25935298204421997, "epoch": 9.0, "percentage": 90.0, "elapsed_time": "0:08:18", "remaining_time": "0:00:55"}
|
|
{"current_steps": 19, "total_steps": 20, "loss": 0.2038, "lr": 1.507684480352292e-07, "epoch": 9.5, "percentage": 95.0, "elapsed_time": "0:08:40", "remaining_time": "0:00:27"}
|
|
{"current_steps": 20, "total_steps": 20, "loss": 0.22, "lr": 3.798061746947995e-08, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "0:09:04", "remaining_time": "0:00:00"}
|
|
{"current_steps": 20, "total_steps": 20, "eval_loss": 0.25876814126968384, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "0:09:52", "remaining_time": "0:00:00"}
|
|
{"current_steps": 20, "total_steps": 20, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "0:09:52", "remaining_time": "0:00:00"}
|