Files
swesmith-unified-10000__Qwe…/trainer_log.jsonl

58 lines
10 KiB
Plaintext
Raw Normal View History

{"current_steps": 5, "total_steps": 259, "loss": 0.3116, "lr": 6.153846153846155e-06, "epoch": 0.13513513513513514, "percentage": 1.93, "elapsed_time": "0:02:40", "remaining_time": "2:15:51"}
{"current_steps": 10, "total_steps": 259, "loss": 0.2587, "lr": 1.3846153846153847e-05, "epoch": 0.2702702702702703, "percentage": 3.86, "elapsed_time": "0:05:13", "remaining_time": "2:10:12"}
{"current_steps": 15, "total_steps": 259, "loss": 0.2116, "lr": 2.153846153846154e-05, "epoch": 0.40540540540540543, "percentage": 5.79, "elapsed_time": "0:07:47", "remaining_time": "2:06:50"}
{"current_steps": 20, "total_steps": 259, "loss": 0.188, "lr": 2.923076923076923e-05, "epoch": 0.5405405405405406, "percentage": 7.72, "elapsed_time": "0:10:19", "remaining_time": "2:03:18"}
{"current_steps": 25, "total_steps": 259, "loss": 0.1511, "lr": 3.692307692307693e-05, "epoch": 0.6756756756756757, "percentage": 9.65, "elapsed_time": "0:12:52", "remaining_time": "2:00:28"}
{"current_steps": 30, "total_steps": 259, "loss": 0.1382, "lr": 3.998364045590232e-05, "epoch": 0.8108108108108109, "percentage": 11.58, "elapsed_time": "0:15:25", "remaining_time": "1:57:47"}
{"current_steps": 35, "total_steps": 259, "loss": 0.1277, "lr": 3.988376236895231e-05, "epoch": 0.9459459459459459, "percentage": 13.51, "elapsed_time": "0:17:58", "remaining_time": "1:55:03"}
{"current_steps": 40, "total_steps": 259, "loss": 0.1171, "lr": 3.969354804762473e-05, "epoch": 1.0810810810810811, "percentage": 15.44, "elapsed_time": "0:20:30", "remaining_time": "1:52:18"}
{"current_steps": 45, "total_steps": 259, "loss": 0.1152, "lr": 3.9413861676735034e-05, "epoch": 1.2162162162162162, "percentage": 17.37, "elapsed_time": "0:23:03", "remaining_time": "1:49:40"}
{"current_steps": 50, "total_steps": 259, "loss": 0.1102, "lr": 3.9045973931977495e-05, "epoch": 1.3513513513513513, "percentage": 19.31, "elapsed_time": "0:25:35", "remaining_time": "1:46:56"}
{"current_steps": 55, "total_steps": 259, "loss": 0.106, "lr": 3.8591556206970594e-05, "epoch": 1.4864864864864864, "percentage": 21.24, "elapsed_time": "0:28:07", "remaining_time": "1:44:20"}
{"current_steps": 60, "total_steps": 259, "loss": 0.1059, "lr": 3.805267301975424e-05, "epoch": 1.6216216216216215, "percentage": 23.17, "elapsed_time": "0:30:40", "remaining_time": "1:41:45"}
{"current_steps": 65, "total_steps": 259, "loss": 0.1042, "lr": 3.743177263323758e-05, "epoch": 1.7567567567567568, "percentage": 25.1, "elapsed_time": "0:33:13", "remaining_time": "1:39:10"}
{"current_steps": 70, "total_steps": 259, "loss": 0.0995, "lr": 3.673167593221097e-05, "epoch": 1.8918918918918919, "percentage": 27.03, "elapsed_time": "0:35:47", "remaining_time": "1:36:38"}
{"current_steps": 75, "total_steps": 259, "loss": 0.0975, "lr": 3.5955563607456025e-05, "epoch": 2.027027027027027, "percentage": 28.96, "elapsed_time": "0:38:23", "remaining_time": "1:34:12"}
{"current_steps": 80, "total_steps": 259, "loss": 0.0949, "lr": 3.510696170517927e-05, "epoch": 2.1621621621621623, "percentage": 30.89, "elapsed_time": "0:40:56", "remaining_time": "1:31:37"}
{"current_steps": 85, "total_steps": 259, "loss": 0.0905, "lr": 3.418972560742133e-05, "epoch": 2.2972972972972974, "percentage": 32.82, "elapsed_time": "0:43:29", "remaining_time": "1:29:02"}
{"current_steps": 90, "total_steps": 259, "loss": 0.091, "lr": 3.3208022516222195e-05, "epoch": 2.4324324324324325, "percentage": 34.75, "elapsed_time": "0:46:02", "remaining_time": "1:26:27"}
{"current_steps": 95, "total_steps": 259, "loss": 0.0876, "lr": 3.2166312521120775e-05, "epoch": 2.5675675675675675, "percentage": 36.68, "elapsed_time": "0:48:34", "remaining_time": "1:23:52"}
{"current_steps": 100, "total_steps": 259, "loss": 0.0865, "lr": 3.106932833600314e-05, "epoch": 2.7027027027027026, "percentage": 38.61, "elapsed_time": "0:51:06", "remaining_time": "1:21:16"}
{"current_steps": 105, "total_steps": 259, "loss": 0.0901, "lr": 2.9922053797359406e-05, "epoch": 2.8378378378378377, "percentage": 40.54, "elapsed_time": "0:53:39", "remaining_time": "1:18:42"}
{"current_steps": 110, "total_steps": 259, "loss": 0.0865, "lr": 2.8729701221636294e-05, "epoch": 2.972972972972973, "percentage": 42.47, "elapsed_time": "0:56:10", "remaining_time": "1:16:05"}
{"current_steps": 115, "total_steps": 259, "loss": 0.0843, "lr": 2.74976877245558e-05, "epoch": 3.108108108108108, "percentage": 44.4, "elapsed_time": "0:58:41", "remaining_time": "1:13:29"}
{"current_steps": 120, "total_steps": 259, "loss": 0.0776, "lr": 2.6231610609986442e-05, "epoch": 3.2432432432432434, "percentage": 46.33, "elapsed_time": "1:01:13", "remaining_time": "1:10:55"}
{"current_steps": 125, "total_steps": 259, "loss": 0.0813, "lr": 2.493722194018082e-05, "epoch": 3.3783783783783785, "percentage": 48.26, "elapsed_time": "1:03:45", "remaining_time": "1:08:20"}
{"current_steps": 130, "total_steps": 259, "loss": 0.0815, "lr": 2.362040240291227e-05, "epoch": 3.5135135135135136, "percentage": 50.19, "elapsed_time": "1:06:17", "remaining_time": "1:05:46"}
{"current_steps": 135, "total_steps": 259, "loss": 0.0778, "lr": 2.228713459423804e-05, "epoch": 3.6486486486486487, "percentage": 52.12, "elapsed_time": "1:08:48", "remaining_time": "1:03:12"}
{"current_steps": 140, "total_steps": 259, "loss": 0.0817, "lr": 2.094347583827102e-05, "epoch": 3.7837837837837838, "percentage": 54.05, "elapsed_time": "1:11:20", "remaining_time": "1:00:38"}
{"current_steps": 145, "total_steps": 259, "loss": 0.076, "lr": 1.9595530667445775e-05, "epoch": 3.918918918918919, "percentage": 55.98, "elapsed_time": "1:13:53", "remaining_time": "0:58:05"}
{"current_steps": 150, "total_steps": 259, "loss": 0.0787, "lr": 1.824942308830696e-05, "epoch": 4.054054054054054, "percentage": 57.92, "elapsed_time": "1:16:24", "remaining_time": "0:55:31"}
{"current_steps": 155, "total_steps": 259, "loss": 0.0752, "lr": 1.691126875882263e-05, "epoch": 4.1891891891891895, "percentage": 59.85, "elapsed_time": "1:18:55", "remaining_time": "0:52:57"}
{"current_steps": 160, "total_steps": 259, "loss": 0.0712, "lr": 1.5587147203626934e-05, "epoch": 4.324324324324325, "percentage": 61.78, "elapsed_time": "1:21:27", "remaining_time": "0:50:24"}
{"current_steps": 165, "total_steps": 259, "loss": 0.0713, "lr": 1.4283074193424379e-05, "epoch": 4.45945945945946, "percentage": 63.71, "elapsed_time": "1:23:58", "remaining_time": "0:47:50"}
{"current_steps": 170, "total_steps": 259, "loss": 0.0738, "lr": 1.3004974414041987e-05, "epoch": 4.594594594594595, "percentage": 65.64, "elapsed_time": "1:26:30", "remaining_time": "0:45:17"}
{"current_steps": 175, "total_steps": 259, "loss": 0.0711, "lr": 1.1758654549299735e-05, "epoch": 4.72972972972973, "percentage": 67.57, "elapsed_time": "1:29:01", "remaining_time": "0:42:43"}
{"current_steps": 180, "total_steps": 259, "loss": 0.0727, "lr": 1.0549776899989686e-05, "epoch": 4.864864864864865, "percentage": 69.5, "elapsed_time": "1:31:31", "remaining_time": "0:40:10"}
{"current_steps": 185, "total_steps": 259, "loss": 0.074, "lr": 9.3838336588184e-06, "epoch": 5.0, "percentage": 71.43, "elapsed_time": "1:34:02", "remaining_time": "0:37:37"}
{"current_steps": 190, "total_steps": 259, "loss": 0.0709, "lr": 8.266121958187246e-06, "epoch": 5.135135135135135, "percentage": 73.36, "elapsed_time": "1:36:34", "remaining_time": "0:35:04"}
{"current_steps": 195, "total_steps": 259, "loss": 0.0683, "lr": 7.201719804173797e-06, "epoch": 5.27027027027027, "percentage": 75.29, "elapsed_time": "1:39:04", "remaining_time": "0:32:31"}
{"current_steps": 200, "total_steps": 259, "loss": 0.0676, "lr": 6.1954630060516005e-06, "epoch": 5.405405405405405, "percentage": 77.22, "elapsed_time": "1:41:36", "remaining_time": "0:29:58"}
{"current_steps": 205, "total_steps": 259, "loss": 0.0698, "lr": 5.2519232061624255e-06, "epoch": 5.54054054054054, "percentage": 79.15, "elapsed_time": "1:44:06", "remaining_time": "0:27:25"}
{"current_steps": 210, "total_steps": 259, "loss": 0.0693, "lr": 4.375387109955953e-06, "epoch": 5.675675675675675, "percentage": 81.08, "elapsed_time": "1:46:37", "remaining_time": "0:24:52"}
{"current_steps": 215, "total_steps": 259, "loss": 0.0661, "lr": 3.569837010559505e-06, "epoch": 5.8108108108108105, "percentage": 83.01, "elapsed_time": "1:49:08", "remaining_time": "0:22:20"}
{"current_steps": 220, "total_steps": 259, "loss": 0.0695, "lr": 2.838932696358798e-06, "epoch": 5.945945945945946, "percentage": 84.94, "elapsed_time": "1:51:40", "remaining_time": "0:19:47"}
{"current_steps": 225, "total_steps": 259, "loss": 0.0681, "lr": 2.1859948237874517e-06, "epoch": 6.081081081081081, "percentage": 86.87, "elapsed_time": "1:54:10", "remaining_time": "0:17:15"}
{"current_steps": 230, "total_steps": 259, "loss": 0.0663, "lr": 1.6139898308664093e-06, "epoch": 6.216216216216216, "percentage": 88.8, "elapsed_time": "1:56:41", "remaining_time": "0:14:42"}
{"current_steps": 235, "total_steps": 259, "loss": 0.0674, "lr": 1.1255164600341816e-06, "epoch": 6.351351351351352, "percentage": 90.73, "elapsed_time": "1:59:13", "remaining_time": "0:12:10"}
{"current_steps": 240, "total_steps": 259, "loss": 0.0666, "lr": 7.227939514977422e-07, "epoch": 6.486486486486487, "percentage": 92.66, "elapsed_time": "2:01:45", "remaining_time": "0:09:38"}
{"current_steps": 245, "total_steps": 259, "loss": 0.0697, "lr": 4.0765196074406433e-07, "epoch": 6.621621621621622, "percentage": 94.59, "elapsed_time": "2:04:17", "remaining_time": "0:07:06"}
{"current_steps": 250, "total_steps": 259, "loss": 0.0666, "lr": 1.8152224601943435e-07, "epoch": 6.756756756756757, "percentage": 96.53, "elapsed_time": "2:06:48", "remaining_time": "0:04:33"}
{"current_steps": 255, "total_steps": 259, "loss": 0.0668, "lr": 4.5432163541960785e-08, "epoch": 6.891891891891892, "percentage": 98.46, "elapsed_time": "2:09:20", "remaining_time": "0:02:01"}
{"current_steps": 259, "total_steps": 259, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "2:11:32", "remaining_time": "0:00:00"}
{"current_steps": 259, "total_steps": 259, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "0:00:00", "remaining_time": "0:00:00"}
{"current_steps": 259, "total_steps": 259, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "0:00:00", "remaining_time": "0:00:00"}
{"current_steps": 259, "total_steps": 259, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "0:00:00", "remaining_time": "0:00:00"}
{"current_steps": 259, "total_steps": 259, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "0:00:00", "remaining_time": "0:00:00"}
{"current_steps": 259, "total_steps": 259, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "0:00:00", "remaining_time": "0:00:00"}