Files
daft-qwen2.5-coder-3b-instr…/trainer_log.jsonl

28 lines
5.4 KiB
Plaintext
Raw Permalink Normal View History

{"current_steps": 130, "total_steps": 387, "loss": 0.11126101016998291, "lr": 8.438497294267117e-06, "epoch": 1.0077594568380213, "percentage": 33.59, "elapsed_time": "0:18:26", "remaining_time": "0:36:26"}
{"current_steps": 140, "total_steps": 387, "loss": 0.10776399374008179, "lr": 8.097241806078616e-06, "epoch": 1.0853540252182348, "percentage": 36.18, "elapsed_time": "0:36:50", "remaining_time": "1:04:59"}
{"current_steps": 150, "total_steps": 387, "loss": 0.10431833267211914, "lr": 7.730761885468486e-06, "epoch": 1.162948593598448, "percentage": 38.76, "elapsed_time": "0:55:23", "remaining_time": "1:27:31"}
{"current_steps": 160, "total_steps": 387, "loss": 0.10304663181304932, "lr": 7.342042203498952e-06, "epoch": 1.2405431619786615, "percentage": 41.34, "elapsed_time": "1:14:02", "remaining_time": "1:45:03"}
{"current_steps": 170, "total_steps": 387, "loss": 0.09784629344940185, "lr": 6.934248555404197e-06, "epoch": 1.3181377303588748, "percentage": 43.93, "elapsed_time": "1:32:53", "remaining_time": "1:58:33"}
{"current_steps": 180, "total_steps": 387, "loss": 0.09537227749824524, "lr": 6.510702077847864e-06, "epoch": 1.3957322987390883, "percentage": 46.51, "elapsed_time": "1:51:08", "remaining_time": "2:07:48"}
{"current_steps": 190, "total_steps": 387, "loss": 0.09520423412322998, "lr": 6.074852201055121e-06, "epoch": 1.4733268671193016, "percentage": 49.1, "elapsed_time": "2:09:17", "remaining_time": "2:14:03"}
{"current_steps": 200, "total_steps": 387, "loss": 0.09088362455368042, "lr": 5.630248556101448e-06, "epoch": 1.5509214354995149, "percentage": 51.68, "elapsed_time": "2:27:46", "remaining_time": "2:18:10"}
{"current_steps": 210, "total_steps": 387, "loss": 0.0899280071258545, "lr": 5.180512066149682e-06, "epoch": 1.6285160038797284, "percentage": 54.26, "elapsed_time": "2:46:36", "remaining_time": "2:20:25"}
{"current_steps": 220, "total_steps": 387, "loss": 0.0881616234779358, "lr": 4.729305457072913e-06, "epoch": 1.706110572259942, "percentage": 56.85, "elapsed_time": "3:04:52", "remaining_time": "2:20:20"}
{"current_steps": 230, "total_steps": 387, "loss": 0.08638249635696411, "lr": 4.280303427629404e-06, "epoch": 1.7837051406401552, "percentage": 59.43, "elapsed_time": "3:23:30", "remaining_time": "2:18:54"}
{"current_steps": 240, "total_steps": 387, "loss": 0.08716154098510742, "lr": 3.8371627221284495e-06, "epoch": 1.8612997090203685, "percentage": 62.02, "elapsed_time": "3:41:53", "remaining_time": "2:15:54"}
{"current_steps": 250, "total_steps": 387, "loss": 0.08580605983734131, "lr": 3.403492349320101e-06, "epoch": 1.938894277400582, "percentage": 64.6, "elapsed_time": "4:00:25", "remaining_time": "2:11:44"}
{"current_steps": 260, "total_steps": 387, "loss": 0.08316840529441834, "lr": 2.982824190050958e-06, "epoch": 2.0155189136760425, "percentage": 67.18, "elapsed_time": "4:18:27", "remaining_time": "2:06:14"}
{"current_steps": 270, "total_steps": 387, "loss": 0.08091338872909545, "lr": 2.5785842330619038e-06, "epoch": 2.093113482056256, "percentage": 69.77, "elapsed_time": "4:37:00", "remaining_time": "2:00:02"}
{"current_steps": 280, "total_steps": 387, "loss": 0.08085420131683349, "lr": 2.1940646731880887e-06, "epoch": 2.1707080504364695, "percentage": 72.35, "elapsed_time": "4:55:04", "remaining_time": "1:52:45"}
{"current_steps": 290, "total_steps": 387, "loss": 0.08156624436378479, "lr": 1.8323970991978823e-06, "epoch": 2.248302618816683, "percentage": 74.94, "elapsed_time": "5:14:09", "remaining_time": "1:45:04"}
{"current_steps": 300, "total_steps": 387, "loss": 0.0808843195438385, "lr": 1.4965269896332884e-06, "epoch": 2.325897187196896, "percentage": 77.52, "elapsed_time": "5:32:45", "remaining_time": "1:36:30"}
{"current_steps": 310, "total_steps": 387, "loss": 0.07979943156242371, "lr": 1.1891897243618184e-06, "epoch": 2.4034917555771096, "percentage": 80.1, "elapsed_time": "5:50:50", "remaining_time": "1:27:08"}
{"current_steps": 320, "total_steps": 387, "loss": 0.08049517869949341, "lr": 9.128883072055411e-07, "epoch": 2.481086323957323, "percentage": 82.69, "elapsed_time": "6:09:14", "remaining_time": "1:17:18"}
{"current_steps": 330, "total_steps": 387, "loss": 0.08011389374732972, "lr": 6.698729810778065e-07, "epoch": 2.558680892337536, "percentage": 85.27, "elapsed_time": "6:27:50", "remaining_time": "1:06:59"}
{"current_steps": 340, "total_steps": 387, "loss": 0.08163015246391296, "lr": 4.6212290164521554e-07, "epoch": 2.6362754607177497, "percentage": 87.86, "elapsed_time": "6:46:09", "remaining_time": "0:56:08"}
{"current_steps": 350, "total_steps": 387, "loss": 0.08051948547363282, "lr": 2.9133001876746004e-07, "epoch": 2.713870029097963, "percentage": 90.44, "elapsed_time": "7:04:35", "remaining_time": "0:44:53"}
{"current_steps": 360, "total_steps": 387, "loss": 0.07719261646270752, "lr": 1.5888529698718347e-07, "epoch": 2.7914645974781767, "percentage": 93.02, "elapsed_time": "7:23:07", "remaining_time": "0:33:14"}
{"current_steps": 370, "total_steps": 387, "loss": 0.08128957152366638, "lr": 6.58673872923693e-08, "epoch": 2.86905916585839, "percentage": 95.61, "elapsed_time": "7:42:08", "remaining_time": "0:21:14"}
{"current_steps": 380, "total_steps": 387, "loss": 0.07743191719055176, "lr": 1.3033842410251074e-08, "epoch": 2.946653734238603, "percentage": 98.19, "elapsed_time": "8:00:28", "remaining_time": "0:08:51"}
{"current_steps": 387, "total_steps": 387, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "8:13:28", "remaining_time": "0:00:00"}