Files
polyalign-qwen2.5-1.5b-en-sft/trainer_log.jsonl
ModelHub XC 2d565ec78d 初始化项目,由ModelHub XC社区提供模型
Model: sathiiiii/polyalign-qwen2.5-1.5b-en-sft
Source: Original Platform
2026-06-01 02:22:17 +08:00

93 lines
18 KiB
JSON

{"current_steps": 100, "total_steps": 9132, "loss": 2.5966, "lr": 1.0831509846827136e-06, "epoch": 0.010950803515207929, "percentage": 1.1, "elapsed_time": "0:02:28", "remaining_time": "3:43:05"}
{"current_steps": 200, "total_steps": 9132, "loss": 2.3125, "lr": 2.177242888402626e-06, "epoch": 0.021901607030415857, "percentage": 2.19, "elapsed_time": "0:04:48", "remaining_time": "3:34:49"}
{"current_steps": 300, "total_steps": 9132, "loss": 2.1574, "lr": 3.2713347921225385e-06, "epoch": 0.03285241054562379, "percentage": 3.29, "elapsed_time": "0:07:09", "remaining_time": "3:30:57"}
{"current_steps": 400, "total_steps": 9132, "loss": 1.9882, "lr": 4.365426695842451e-06, "epoch": 0.043803214060831715, "percentage": 4.38, "elapsed_time": "0:09:31", "remaining_time": "3:28:02"}
{"current_steps": 500, "total_steps": 9132, "loss": 1.9221, "lr": 5.459518599562363e-06, "epoch": 0.05475401757603964, "percentage": 5.48, "elapsed_time": "0:11:52", "remaining_time": "3:25:04"}
{"current_steps": 600, "total_steps": 9132, "loss": 1.9077, "lr": 6.553610503282276e-06, "epoch": 0.06570482109124758, "percentage": 6.57, "elapsed_time": "0:14:14", "remaining_time": "3:22:37"}
{"current_steps": 700, "total_steps": 9132, "loss": 1.8748, "lr": 7.64770240700219e-06, "epoch": 0.0766556246064555, "percentage": 7.67, "elapsed_time": "0:16:34", "remaining_time": "3:19:36"}
{"current_steps": 800, "total_steps": 9132, "loss": 1.88, "lr": 8.741794310722102e-06, "epoch": 0.08760642812166343, "percentage": 8.76, "elapsed_time": "0:18:55", "remaining_time": "3:17:10"}
{"current_steps": 900, "total_steps": 9132, "loss": 1.8617, "lr": 9.835886214442013e-06, "epoch": 0.09855723163687136, "percentage": 9.86, "elapsed_time": "0:21:17", "remaining_time": "3:14:41"}
{"current_steps": 1000, "total_steps": 9132, "loss": 1.8323, "lr": 9.997360588415263e-06, "epoch": 0.10950803515207928, "percentage": 10.95, "elapsed_time": "0:23:38", "remaining_time": "3:12:17"}
{"current_steps": 1100, "total_steps": 9132, "loss": 1.8238, "lr": 9.987501154068591e-06, "epoch": 0.12045883866728721, "percentage": 12.05, "elapsed_time": "0:25:59", "remaining_time": "3:09:47"}
{"current_steps": 1200, "total_steps": 9132, "loss": 1.8213, "lr": 9.970353900512644e-06, "epoch": 0.13140964218249515, "percentage": 13.14, "elapsed_time": "0:28:19", "remaining_time": "3:07:11"}
{"current_steps": 1300, "total_steps": 9132, "loss": 1.8147, "lr": 9.945943883598031e-06, "epoch": 0.14236044569770306, "percentage": 14.24, "elapsed_time": "0:30:41", "remaining_time": "3:04:54"}
{"current_steps": 1400, "total_steps": 9132, "loss": 1.7824, "lr": 9.914306771645357e-06, "epoch": 0.153311249212911, "percentage": 15.33, "elapsed_time": "0:33:04", "remaining_time": "3:02:41"}
{"current_steps": 1500, "total_steps": 9132, "loss": 1.7896, "lr": 9.875488793326074e-06, "epoch": 0.16426205272811892, "percentage": 16.43, "elapsed_time": "0:35:25", "remaining_time": "3:00:13"}
{"current_steps": 1600, "total_steps": 9132, "loss": 1.7788, "lr": 9.82954667011238e-06, "epoch": 0.17521285624332686, "percentage": 17.52, "elapsed_time": "0:37:47", "remaining_time": "2:57:53"}
{"current_steps": 1700, "total_steps": 9132, "loss": 1.7894, "lr": 9.776547533394874e-06, "epoch": 0.18616365975853477, "percentage": 18.62, "elapsed_time": "0:40:09", "remaining_time": "2:55:31"}
{"current_steps": 1800, "total_steps": 9132, "loss": 1.752, "lr": 9.716568826389045e-06, "epoch": 0.1971144632737427, "percentage": 19.71, "elapsed_time": "0:42:32", "remaining_time": "2:53:16"}
{"current_steps": 1900, "total_steps": 9132, "loss": 1.7587, "lr": 9.649698190973977e-06, "epoch": 0.20806526678895063, "percentage": 20.81, "elapsed_time": "0:44:54", "remaining_time": "2:50:55"}
{"current_steps": 2000, "total_steps": 9132, "loss": 1.7648, "lr": 9.576033339628578e-06, "epoch": 0.21901607030415857, "percentage": 21.9, "elapsed_time": "0:47:14", "remaining_time": "2:48:28"}
{"current_steps": 2100, "total_steps": 9132, "loss": 1.7507, "lr": 9.495681912652486e-06, "epoch": 0.2299668738193665, "percentage": 23.0, "elapsed_time": "0:49:34", "remaining_time": "2:46:01"}
{"current_steps": 2200, "total_steps": 9132, "loss": 1.7628, "lr": 9.408761320880292e-06, "epoch": 0.24091767733457442, "percentage": 24.09, "elapsed_time": "0:51:56", "remaining_time": "2:43:41"}
{"current_steps": 2300, "total_steps": 9132, "loss": 1.7299, "lr": 9.315398574118876e-06, "epoch": 0.25186848084978236, "percentage": 25.19, "elapsed_time": "0:54:18", "remaining_time": "2:41:19"}
{"current_steps": 2400, "total_steps": 9132, "loss": 1.7188, "lr": 9.215730095558582e-06, "epoch": 0.2628192843649903, "percentage": 26.28, "elapsed_time": "0:56:38", "remaining_time": "2:38:51"}
{"current_steps": 2500, "total_steps": 9132, "loss": 1.7139, "lr": 9.10990152242939e-06, "epoch": 0.2737700878801982, "percentage": 27.38, "elapsed_time": "0:59:02", "remaining_time": "2:36:36"}
{"current_steps": 2600, "total_steps": 9132, "loss": 1.711, "lr": 8.998067493193395e-06, "epoch": 0.28472089139540613, "percentage": 28.47, "elapsed_time": "1:01:23", "remaining_time": "2:34:13"}
{"current_steps": 2700, "total_steps": 9132, "loss": 1.7143, "lr": 8.880391421584511e-06, "epoch": 0.29567169491061407, "percentage": 29.57, "elapsed_time": "1:03:43", "remaining_time": "2:31:49"}
{"current_steps": 2800, "total_steps": 9132, "loss": 1.693, "lr": 8.757045257825642e-06, "epoch": 0.306622498425822, "percentage": 30.66, "elapsed_time": "1:06:06", "remaining_time": "2:29:30"}
{"current_steps": 2900, "total_steps": 9132, "loss": 1.6915, "lr": 8.628209237372148e-06, "epoch": 0.31757330194102995, "percentage": 31.76, "elapsed_time": "1:08:29", "remaining_time": "2:27:11"}
{"current_steps": 3000, "total_steps": 9132, "loss": 1.6932, "lr": 8.494071617548831e-06, "epoch": 0.32852410545623784, "percentage": 32.85, "elapsed_time": "1:10:50", "remaining_time": "2:24:48"}
{"current_steps": 3100, "total_steps": 9132, "loss": 1.6522, "lr": 8.354828402465215e-06, "epoch": 0.3394749089714458, "percentage": 33.95, "elapsed_time": "1:13:10", "remaining_time": "2:22:22"}
{"current_steps": 3200, "total_steps": 9132, "loss": 1.6759, "lr": 8.210683056611086e-06, "epoch": 0.3504257124866537, "percentage": 35.04, "elapsed_time": "1:15:31", "remaining_time": "2:20:00"}
{"current_steps": 3300, "total_steps": 9132, "loss": 1.6584, "lr": 8.06184620755083e-06, "epoch": 0.36137651600186166, "percentage": 36.14, "elapsed_time": "1:17:52", "remaining_time": "2:17:37"}
{"current_steps": 3400, "total_steps": 9132, "loss": 1.6598, "lr": 7.90853533815094e-06, "epoch": 0.37232731951706954, "percentage": 37.23, "elapsed_time": "1:20:14", "remaining_time": "2:15:16"}
{"current_steps": 3500, "total_steps": 9132, "loss": 1.6602, "lr": 7.750974468790462e-06, "epoch": 0.3832781230322775, "percentage": 38.33, "elapsed_time": "1:22:34", "remaining_time": "2:12:53"}
{"current_steps": 3600, "total_steps": 9132, "loss": 1.6466, "lr": 7.589393830018696e-06, "epoch": 0.3942289265474854, "percentage": 39.42, "elapsed_time": "1:24:56", "remaining_time": "2:10:31"}
{"current_steps": 3700, "total_steps": 9132, "loss": 1.6247, "lr": 7.4240295261385205e-06, "epoch": 0.40517973006269337, "percentage": 40.52, "elapsed_time": "1:27:16", "remaining_time": "2:08:08"}
{"current_steps": 3800, "total_steps": 9132, "loss": 1.6204, "lr": 7.2551231902068775e-06, "epoch": 0.41613053357790125, "percentage": 41.61, "elapsed_time": "1:29:38", "remaining_time": "2:05:46"}
{"current_steps": 3900, "total_steps": 9132, "loss": 1.618, "lr": 7.082921630956545e-06, "epoch": 0.4270813370931092, "percentage": 42.71, "elapsed_time": "1:31:57", "remaining_time": "2:03:22"}
{"current_steps": 4000, "total_steps": 9132, "loss": 1.6237, "lr": 6.9076764721551385e-06, "epoch": 0.43803214060831713, "percentage": 43.8, "elapsed_time": "1:34:18", "remaining_time": "2:00:59"}
{"current_steps": 4100, "total_steps": 9132, "loss": 1.6185, "lr": 6.729643784928295e-06, "epoch": 0.4489829441235251, "percentage": 44.9, "elapsed_time": "1:36:40", "remaining_time": "1:58:38"}
{"current_steps": 4200, "total_steps": 9132, "loss": 1.6114, "lr": 6.549083713584314e-06, "epoch": 0.459933747638733, "percentage": 45.99, "elapsed_time": "1:38:59", "remaining_time": "1:56:14"}
{"current_steps": 4300, "total_steps": 9132, "loss": 1.6123, "lr": 6.366260095486977e-06, "epoch": 0.4708845511539409, "percentage": 47.09, "elapsed_time": "1:41:18", "remaining_time": "1:53:50"}
{"current_steps": 4400, "total_steps": 9132, "loss": 1.5628, "lr": 6.181440075532042e-06, "epoch": 0.48183535466914884, "percentage": 48.18, "elapsed_time": "1:43:40", "remaining_time": "1:51:30"}
{"current_steps": 4500, "total_steps": 9132, "loss": 1.5712, "lr": 5.99489371579069e-06, "epoch": 0.4927861581843568, "percentage": 49.28, "elapsed_time": "1:46:02", "remaining_time": "1:49:09"}
{"current_steps": 4600, "total_steps": 9132, "loss": 1.5599, "lr": 5.806893600890361e-06, "epoch": 0.5037369616995647, "percentage": 50.37, "elapsed_time": "1:48:22", "remaining_time": "1:46:46"}
{"current_steps": 4700, "total_steps": 9132, "loss": 1.5595, "lr": 5.617714439709588e-06, "epoch": 0.5146877652147727, "percentage": 51.47, "elapsed_time": "1:50:43", "remaining_time": "1:44:25"}
{"current_steps": 4800, "total_steps": 9132, "loss": 1.5747, "lr": 5.42763266396884e-06, "epoch": 0.5256385687299806, "percentage": 52.56, "elapsed_time": "1:53:05", "remaining_time": "1:42:04"}
{"current_steps": 4900, "total_steps": 9132, "loss": 1.5547, "lr": 5.236926024303909e-06, "epoch": 0.5365893722451885, "percentage": 53.66, "elapsed_time": "1:55:25", "remaining_time": "1:39:41"}
{"current_steps": 5000, "total_steps": 9132, "loss": 1.5846, "lr": 5.045873184412099e-06, "epoch": 0.5475401757603964, "percentage": 54.75, "elapsed_time": "1:57:44", "remaining_time": "1:37:18"}
{"current_steps": 5100, "total_steps": 9132, "loss": 1.5473, "lr": 4.854753313864212e-06, "epoch": 0.5584909792756043, "percentage": 55.85, "elapsed_time": "2:00:03", "remaining_time": "1:34:55"}
{"current_steps": 5200, "total_steps": 9132, "loss": 1.5513, "lr": 4.663845680177349e-06, "epoch": 0.5694417827908123, "percentage": 56.94, "elapsed_time": "2:02:26", "remaining_time": "1:32:34"}
{"current_steps": 5300, "total_steps": 9132, "loss": 1.5596, "lr": 4.473429240744606e-06, "epoch": 0.5803925863060202, "percentage": 58.04, "elapsed_time": "2:04:48", "remaining_time": "1:30:14"}
{"current_steps": 5400, "total_steps": 9132, "loss": 1.5334, "lr": 4.283782235217901e-06, "epoch": 0.5913433898212281, "percentage": 59.13, "elapsed_time": "2:07:10", "remaining_time": "1:27:53"}
{"current_steps": 5500, "total_steps": 9132, "loss": 1.5183, "lr": 4.095181778939598e-06, "epoch": 0.6022941933364361, "percentage": 60.23, "elapsed_time": "2:09:30", "remaining_time": "1:25:31"}
{"current_steps": 5600, "total_steps": 9132, "loss": 1.5402, "lr": 3.90790345801699e-06, "epoch": 0.613244996851644, "percentage": 61.32, "elapsed_time": "2:11:51", "remaining_time": "1:23:09"}
{"current_steps": 5700, "total_steps": 9132, "loss": 1.5132, "lr": 3.7222209266313026e-06, "epoch": 0.624195800366852, "percentage": 62.42, "elapsed_time": "2:14:14", "remaining_time": "1:20:49"}
{"current_steps": 5800, "total_steps": 9132, "loss": 1.5098, "lr": 3.538405507169692e-06, "epoch": 0.6351466038820599, "percentage": 63.51, "elapsed_time": "2:16:35", "remaining_time": "1:18:27"}
{"current_steps": 5900, "total_steps": 9132, "loss": 1.5147, "lr": 3.356725793764477e-06, "epoch": 0.6460974073972677, "percentage": 64.61, "elapsed_time": "2:18:55", "remaining_time": "1:16:06"}
{"current_steps": 6000, "total_steps": 9132, "loss": 1.5384, "lr": 3.1774472598189503e-06, "epoch": 0.6570482109124757, "percentage": 65.7, "elapsed_time": "2:21:17", "remaining_time": "1:13:45"}
{"current_steps": 6100, "total_steps": 9132, "loss": 1.5411, "lr": 3.0008318700932426e-06, "epoch": 0.6679990144276836, "percentage": 66.8, "elapsed_time": "2:23:38", "remaining_time": "1:11:23"}
{"current_steps": 6200, "total_steps": 9132, "loss": 1.5003, "lr": 2.827137697917096e-06, "epoch": 0.6789498179428916, "percentage": 67.89, "elapsed_time": "2:26:00", "remaining_time": "1:09:02"}
{"current_steps": 6300, "total_steps": 9132, "loss": 1.5175, "lr": 2.6566185480888276e-06, "epoch": 0.6899006214580995, "percentage": 68.99, "elapsed_time": "2:28:20", "remaining_time": "1:06:40"}
{"current_steps": 6400, "total_steps": 9132, "loss": 1.4974, "lr": 2.4895235860115652e-06, "epoch": 0.7008514249733074, "percentage": 70.08, "elapsed_time": "2:30:41", "remaining_time": "1:04:19"}
{"current_steps": 6500, "total_steps": 9132, "loss": 1.497, "lr": 2.326096973608648e-06, "epoch": 0.7118022284885154, "percentage": 71.18, "elapsed_time": "2:33:01", "remaining_time": "1:01:57"}
{"current_steps": 6600, "total_steps": 9132, "loss": 1.502, "lr": 2.166577512550162e-06, "epoch": 0.7227530320037233, "percentage": 72.27, "elapsed_time": "2:35:21", "remaining_time": "0:59:35"}
{"current_steps": 6700, "total_steps": 9132, "loss": 1.5173, "lr": 2.0111982953120073e-06, "epoch": 0.7337038355189311, "percentage": 73.37, "elapsed_time": "2:37:42", "remaining_time": "0:57:14"}
{"current_steps": 6800, "total_steps": 9132, "loss": 1.4877, "lr": 1.8601863645773128e-06, "epoch": 0.7446546390341391, "percentage": 74.46, "elapsed_time": "2:40:03", "remaining_time": "0:54:53"}
{"current_steps": 6900, "total_steps": 9132, "loss": 1.4705, "lr": 1.7137623814779036e-06, "epoch": 0.755605442549347, "percentage": 75.56, "elapsed_time": "2:42:24", "remaining_time": "0:52:31"}
{"current_steps": 7000, "total_steps": 9132, "loss": 1.4747, "lr": 1.5721403031606048e-06, "epoch": 0.766556246064555, "percentage": 76.65, "elapsed_time": "2:44:47", "remaining_time": "0:50:11"}
{"current_steps": 7100, "total_steps": 9132, "loss": 1.5005, "lr": 1.43552707014953e-06, "epoch": 0.7775070495797629, "percentage": 77.75, "elapsed_time": "2:47:10", "remaining_time": "0:47:50"}
{"current_steps": 7200, "total_steps": 9132, "loss": 1.5038, "lr": 1.3041223039611489e-06, "epoch": 0.7884578530949709, "percentage": 78.84, "elapsed_time": "2:49:33", "remaining_time": "0:45:29"}
{"current_steps": 7300, "total_steps": 9132, "loss": 1.5086, "lr": 1.1781180154140331e-06, "epoch": 0.7994086566101788, "percentage": 79.94, "elapsed_time": "2:51:54", "remaining_time": "0:43:08"}
{"current_steps": 7400, "total_steps": 9132, "loss": 1.4665, "lr": 1.057698324059469e-06, "epoch": 0.8103594601253867, "percentage": 81.03, "elapsed_time": "2:54:14", "remaining_time": "0:40:46"}
{"current_steps": 7500, "total_steps": 9132, "loss": 1.4686, "lr": 9.43039189142922e-07, "epoch": 0.8213102636405947, "percentage": 82.13, "elapsed_time": "2:56:32", "remaining_time": "0:38:25"}
{"current_steps": 7600, "total_steps": 9132, "loss": 1.4933, "lr": 8.343081524894763e-07, "epoch": 0.8322610671558025, "percentage": 83.22, "elapsed_time": "2:58:54", "remaining_time": "0:36:03"}
{"current_steps": 7700, "total_steps": 9132, "loss": 1.4976, "lr": 7.316640936889491e-07, "epoch": 0.8432118706710104, "percentage": 84.32, "elapsed_time": "3:01:15", "remaining_time": "0:33:42"}
{"current_steps": 7800, "total_steps": 9132, "loss": 1.4663, "lr": 6.352569979384027e-07, "epoch": 0.8541626741862184, "percentage": 85.41, "elapsed_time": "3:03:34", "remaining_time": "0:31:21"}
{"current_steps": 7900, "total_steps": 9132, "loss": 1.4635, "lr": 5.452277368812936e-07, "epoch": 0.8651134777014263, "percentage": 86.51, "elapsed_time": "3:05:55", "remaining_time": "0:28:59"}
{"current_steps": 8000, "total_steps": 9132, "loss": 1.4739, "lr": 4.617078627635019e-07, "epoch": 0.8760642812166343, "percentage": 87.6, "elapsed_time": "3:08:15", "remaining_time": "0:26:38"}
{"current_steps": 8100, "total_steps": 9132, "loss": 1.4525, "lr": 3.8481941620700127e-07, "epoch": 0.8870150847318422, "percentage": 88.7, "elapsed_time": "3:10:34", "remaining_time": "0:24:16"}
{"current_steps": 8200, "total_steps": 9132, "loss": 1.4467, "lr": 3.146747478820938e-07, "epoch": 0.8979658882470501, "percentage": 89.79, "elapsed_time": "3:12:54", "remaining_time": "0:21:55"}
{"current_steps": 8300, "total_steps": 9132, "loss": 1.4893, "lr": 2.513763543387465e-07, "epoch": 0.9089166917622581, "percentage": 90.89, "elapsed_time": "3:15:16", "remaining_time": "0:19:34"}
{"current_steps": 8400, "total_steps": 9132, "loss": 1.4246, "lr": 1.9501672823693584e-07, "epoch": 0.919867495277466, "percentage": 91.98, "elapsed_time": "3:17:35", "remaining_time": "0:17:13"}
{"current_steps": 8500, "total_steps": 9132, "loss": 1.456, "lr": 1.4567822319484614e-07, "epoch": 0.9308182987926739, "percentage": 93.08, "elapsed_time": "3:19:56", "remaining_time": "0:14:52"}
{"current_steps": 8600, "total_steps": 9132, "loss": 1.4473, "lr": 1.0343293345239702e-07, "epoch": 0.9417691023078818, "percentage": 94.17, "elapsed_time": "3:22:16", "remaining_time": "0:12:30"}
{"current_steps": 8700, "total_steps": 9132, "loss": 1.4813, "lr": 6.834258852594866e-08, "epoch": 0.9527199058230897, "percentage": 95.27, "elapsed_time": "3:24:36", "remaining_time": "0:10:09"}
{"current_steps": 8800, "total_steps": 9132, "loss": 1.4259, "lr": 4.045846300811229e-08, "epoch": 0.9636707093382977, "percentage": 96.36, "elapsed_time": "3:27:01", "remaining_time": "0:07:48"}
{"current_steps": 8900, "total_steps": 9132, "loss": 1.4595, "lr": 1.9821301644462056e-08, "epoch": 0.9746215128535056, "percentage": 97.46, "elapsed_time": "3:29:23", "remaining_time": "0:05:27"}
{"current_steps": 9000, "total_steps": 9132, "loss": 1.4601, "lr": 6.461259796644026e-09, "epoch": 0.9855723163687136, "percentage": 98.55, "elapsed_time": "3:31:43", "remaining_time": "0:03:06"}
{"current_steps": 9100, "total_steps": 9132, "loss": 1.4738, "lr": 3.978593788622753e-10, "epoch": 0.9965231198839215, "percentage": 99.65, "elapsed_time": "3:34:03", "remaining_time": "0:00:45"}
{"current_steps": 9132, "total_steps": 9132, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "3:35:30", "remaining_time": "0:00:00"}