Files
Llama3.2-3B_Paper_Impact_me…/trainer_log.jsonl

35 lines
6.4 KiB
Plaintext
Raw Normal View History

{"current_steps": 5, "total_steps": 166, "loss": 0.284, "lr": 4.705882352941177e-06, "epoch": 0.030211480362537766, "percentage": 3.01, "elapsed_time": "0:00:38", "remaining_time": "0:20:24"}
{"current_steps": 10, "total_steps": 166, "loss": 0.091, "lr": 1.0588235294117648e-05, "epoch": 0.06042296072507553, "percentage": 6.02, "elapsed_time": "0:01:15", "remaining_time": "0:19:38"}
{"current_steps": 15, "total_steps": 166, "loss": 0.0881, "lr": 1.647058823529412e-05, "epoch": 0.09063444108761329, "percentage": 9.04, "elapsed_time": "0:01:52", "remaining_time": "0:18:51"}
{"current_steps": 20, "total_steps": 166, "loss": 0.0856, "lr": 1.9991110182465032e-05, "epoch": 0.12084592145015106, "percentage": 12.05, "elapsed_time": "0:02:29", "remaining_time": "0:18:10"}
{"current_steps": 25, "total_steps": 166, "loss": 0.0776, "lr": 1.9891281165856876e-05, "epoch": 0.1510574018126888, "percentage": 15.06, "elapsed_time": "0:03:06", "remaining_time": "0:17:30"}
{"current_steps": 30, "total_steps": 166, "loss": 0.0796, "lr": 1.968162302997659e-05, "epoch": 0.18126888217522658, "percentage": 18.07, "elapsed_time": "0:03:43", "remaining_time": "0:16:51"}
{"current_steps": 35, "total_steps": 166, "loss": 0.0775, "lr": 1.9364463741042694e-05, "epoch": 0.21148036253776434, "percentage": 21.08, "elapsed_time": "0:04:20", "remaining_time": "0:16:15"}
{"current_steps": 40, "total_steps": 166, "loss": 0.0776, "lr": 1.8943324918225495e-05, "epoch": 0.24169184290030213, "percentage": 24.1, "elapsed_time": "0:04:58", "remaining_time": "0:15:38"}
{"current_steps": 45, "total_steps": 166, "loss": 0.0778, "lr": 1.8422882730893323e-05, "epoch": 0.2719033232628399, "percentage": 27.11, "elapsed_time": "0:05:35", "remaining_time": "0:15:00"}
{"current_steps": 50, "total_steps": 166, "loss": 0.0776, "lr": 1.7808915976161364e-05, "epoch": 0.3021148036253776, "percentage": 30.12, "elapsed_time": "0:06:11", "remaining_time": "0:14:21"}
{"current_steps": 55, "total_steps": 166, "loss": 0.0787, "lr": 1.710824191327075e-05, "epoch": 0.3323262839879154, "percentage": 33.13, "elapsed_time": "0:06:47", "remaining_time": "0:13:42"}
{"current_steps": 60, "total_steps": 166, "loss": 0.079, "lr": 1.632864056726917e-05, "epoch": 0.36253776435045315, "percentage": 36.14, "elapsed_time": "0:07:23", "remaining_time": "0:13:03"}
{"current_steps": 65, "total_steps": 166, "loss": 0.0776, "lr": 1.5478768342496872e-05, "epoch": 0.39274924471299094, "percentage": 39.16, "elapsed_time": "0:08:01", "remaining_time": "0:12:27"}
{"current_steps": 70, "total_steps": 166, "loss": 0.0779, "lr": 1.4568061905081874e-05, "epoch": 0.4229607250755287, "percentage": 42.17, "elapsed_time": "0:08:37", "remaining_time": "0:11:50"}
{"current_steps": 75, "total_steps": 166, "loss": 0.0782, "lr": 1.3606633401697557e-05, "epoch": 0.45317220543806647, "percentage": 45.18, "elapsed_time": "0:09:15", "remaining_time": "0:11:13"}
{"current_steps": 80, "total_steps": 166, "loss": 0.0791, "lr": 1.2605158178034656e-05, "epoch": 0.48338368580060426, "percentage": 48.19, "elapsed_time": "0:09:52", "remaining_time": "0:10:36"}
{"current_steps": 85, "total_steps": 166, "loss": 0.0792, "lr": 1.157475624372018e-05, "epoch": 0.513595166163142, "percentage": 51.2, "elapsed_time": "0:10:29", "remaining_time": "0:10:00"}
{"current_steps": 90, "total_steps": 166, "loss": 0.0779, "lr": 1.0526868799852797e-05, "epoch": 0.5438066465256798, "percentage": 54.22, "elapsed_time": "0:11:06", "remaining_time": "0:09:23"}
{"current_steps": 95, "total_steps": 166, "loss": 0.0781, "lr": 9.473131200147205e-06, "epoch": 0.5740181268882175, "percentage": 57.23, "elapsed_time": "0:11:43", "remaining_time": "0:08:45"}
{"current_steps": 100, "total_steps": 166, "loss": 0.0771, "lr": 8.425243756279824e-06, "epoch": 0.6042296072507553, "percentage": 60.24, "elapsed_time": "0:12:20", "remaining_time": "0:08:08"}
{"current_steps": 105, "total_steps": 166, "loss": 0.0771, "lr": 7.394841821965345e-06, "epoch": 0.6344410876132931, "percentage": 63.25, "elapsed_time": "0:12:58", "remaining_time": "0:07:32"}
{"current_steps": 110, "total_steps": 166, "loss": 0.0776, "lr": 6.3933665983024465e-06, "epoch": 0.6646525679758308, "percentage": 66.27, "elapsed_time": "0:13:35", "remaining_time": "0:06:55"}
{"current_steps": 115, "total_steps": 166, "loss": 0.0767, "lr": 5.431938094918132e-06, "epoch": 0.6948640483383686, "percentage": 69.28, "elapsed_time": "0:14:11", "remaining_time": "0:06:17"}
{"current_steps": 120, "total_steps": 166, "loss": 0.0778, "lr": 4.5212316575031325e-06, "epoch": 0.7250755287009063, "percentage": 72.29, "elapsed_time": "0:14:48", "remaining_time": "0:05:40"}
{"current_steps": 125, "total_steps": 166, "loss": 0.0776, "lr": 3.6713594327308343e-06, "epoch": 0.7552870090634441, "percentage": 75.3, "elapsed_time": "0:15:26", "remaining_time": "0:05:03"}
{"current_steps": 130, "total_steps": 166, "loss": 0.0769, "lr": 2.891758086729253e-06, "epoch": 0.7854984894259819, "percentage": 78.31, "elapsed_time": "0:16:02", "remaining_time": "0:04:26"}
{"current_steps": 135, "total_steps": 166, "loss": 0.0768, "lr": 2.19108402383864e-06, "epoch": 0.8157099697885196, "percentage": 81.33, "elapsed_time": "0:16:39", "remaining_time": "0:03:49"}
{"current_steps": 140, "total_steps": 166, "loss": 0.0765, "lr": 1.5771172691066793e-06, "epoch": 0.8459214501510574, "percentage": 84.34, "elapsed_time": "0:17:16", "remaining_time": "0:03:12"}
{"current_steps": 145, "total_steps": 166, "loss": 0.077, "lr": 1.0566750817745076e-06, "epoch": 0.8761329305135952, "percentage": 87.35, "elapsed_time": "0:17:53", "remaining_time": "0:02:35"}
{"current_steps": 150, "total_steps": 166, "loss": 0.0758, "lr": 6.355362589573078e-07, "epoch": 0.9063444108761329, "percentage": 90.36, "elapsed_time": "0:18:32", "remaining_time": "0:01:58"}
{"current_steps": 155, "total_steps": 166, "loss": 0.0775, "lr": 3.1837697002341293e-07, "epoch": 0.9365558912386707, "percentage": 93.37, "elapsed_time": "0:19:07", "remaining_time": "0:01:21"}
{"current_steps": 160, "total_steps": 166, "loss": 0.0758, "lr": 1.0871883414312778e-07, "epoch": 0.9667673716012085, "percentage": 96.39, "elapsed_time": "0:19:43", "remaining_time": "0:00:44"}
{"current_steps": 165, "total_steps": 166, "loss": 0.0768, "lr": 8.889817534969425e-09, "epoch": 0.9969788519637462, "percentage": 99.4, "elapsed_time": "0:20:21", "remaining_time": "0:00:07"}
{"current_steps": 166, "total_steps": 166, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:20:53", "remaining_time": "0:00:00"}