Files
grpo-tool-sat-sft-qwen3-1p7…/trainer_log.jsonl
ModelHub XC c1b860e80a 初始化项目,由ModelHub XC社区提供模型
Model: raca-workspace-v1/grpo-tool-sat-sft-qwen3-1p7b-sft-20260419-075623-96e9
Source: Original Platform
2026-05-28 09:48:20 +08:00

42 lines
7.2 KiB
JSON

{"current_steps": 25, "total_steps": 1000, "loss": 2.3428, "lr": 1.6000000000000003e-05, "epoch": 0.05, "percentage": 2.5, "elapsed_time": "0:00:14", "remaining_time": "0:09:09"}
{"current_steps": 50, "total_steps": 1000, "loss": 0.7368, "lr": 1.998107236150145e-05, "epoch": 0.1, "percentage": 5.0, "elapsed_time": "0:00:25", "remaining_time": "0:08:11"}
{"current_steps": 75, "total_steps": 1000, "loss": 0.5067, "lr": 1.989863301061654e-05, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "0:00:37", "remaining_time": "0:07:44"}
{"current_steps": 100, "total_steps": 1000, "loss": 0.4279, "lr": 1.9751334064160708e-05, "epoch": 0.2, "percentage": 10.0, "elapsed_time": "0:00:49", "remaining_time": "0:07:24"}
{"current_steps": 125, "total_steps": 1000, "loss": 0.419, "lr": 1.9540140680664915e-05, "epoch": 0.25, "percentage": 12.5, "elapsed_time": "0:01:01", "remaining_time": "0:07:08"}
{"current_steps": 150, "total_steps": 1000, "loss": 0.4207, "lr": 1.9266436679230866e-05, "epoch": 0.3, "percentage": 15.0, "elapsed_time": "0:01:13", "remaining_time": "0:06:53"}
{"current_steps": 175, "total_steps": 1000, "loss": 0.4169, "lr": 1.8932015472223692e-05, "epoch": 0.35, "percentage": 17.5, "elapsed_time": "0:01:24", "remaining_time": "0:06:39"}
{"current_steps": 200, "total_steps": 1000, "loss": 0.4185, "lr": 1.8539068314154355e-05, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "0:01:36", "remaining_time": "0:06:26"}
{"current_steps": 225, "total_steps": 1000, "loss": 0.4197, "lr": 1.8090169943749477e-05, "epoch": 0.45, "percentage": 22.5, "elapsed_time": "0:01:48", "remaining_time": "0:06:13"}
{"current_steps": 250, "total_steps": 1000, "loss": 0.42, "lr": 1.758826171328727e-05, "epoch": 0.5, "percentage": 25.0, "elapsed_time": "0:02:00", "remaining_time": "0:06:00"}
{"current_steps": 275, "total_steps": 1000, "loss": 0.4209, "lr": 1.7036632315742464e-05, "epoch": 0.55, "percentage": 27.5, "elapsed_time": "0:02:12", "remaining_time": "0:05:48"}
{"current_steps": 300, "total_steps": 1000, "loss": 0.4168, "lr": 1.6438896236023374e-05, "epoch": 0.6, "percentage": 30.0, "elapsed_time": "0:02:23", "remaining_time": "0:05:35"}
{"current_steps": 325, "total_steps": 1000, "loss": 0.4155, "lr": 1.57989700674967e-05, "epoch": 0.65, "percentage": 32.5, "elapsed_time": "0:02:35", "remaining_time": "0:05:23"}
{"current_steps": 350, "total_steps": 1000, "loss": 0.4171, "lr": 1.512104684898319e-05, "epoch": 0.7, "percentage": 35.0, "elapsed_time": "0:02:47", "remaining_time": "0:05:11"}
{"current_steps": 375, "total_steps": 1000, "loss": 0.4143, "lr": 1.4409568590377918e-05, "epoch": 0.75, "percentage": 37.5, "elapsed_time": "0:02:59", "remaining_time": "0:04:58"}
{"current_steps": 400, "total_steps": 1000, "loss": 0.4144, "lr": 1.3669197166917723e-05, "epoch": 0.8, "percentage": 40.0, "elapsed_time": "0:03:11", "remaining_time": "0:04:46"}
{"current_steps": 425, "total_steps": 1000, "loss": 0.4152, "lr": 1.2904783772807534e-05, "epoch": 0.85, "percentage": 42.5, "elapsed_time": "0:03:23", "remaining_time": "0:04:34"}
{"current_steps": 450, "total_steps": 1000, "loss": 0.4161, "lr": 1.2121337134357121e-05, "epoch": 0.9, "percentage": 45.0, "elapsed_time": "0:03:34", "remaining_time": "0:04:22"}
{"current_steps": 475, "total_steps": 1000, "loss": 0.4154, "lr": 1.1323990690907734e-05, "epoch": 0.95, "percentage": 47.5, "elapsed_time": "0:03:46", "remaining_time": "0:04:10"}
{"current_steps": 500, "total_steps": 1000, "loss": 0.4142, "lr": 1.0517968958591705e-05, "epoch": 1.0, "percentage": 50.0, "elapsed_time": "0:03:58", "remaining_time": "0:03:58"}
{"current_steps": 525, "total_steps": 1000, "loss": 0.4138, "lr": 9.708553297322407e-06, "epoch": 1.05, "percentage": 52.5, "elapsed_time": "0:04:43", "remaining_time": "0:04:16"}
{"current_steps": 550, "total_steps": 1000, "loss": 0.4142, "lr": 8.901047305322172e-06, "epoch": 1.1, "percentage": 55.0, "elapsed_time": "0:04:55", "remaining_time": "0:04:01"}
{"current_steps": 575, "total_steps": 1000, "loss": 0.4138, "lr": 8.100742067936432e-06, "epoch": 1.15, "percentage": 57.5, "elapsed_time": "0:05:06", "remaining_time": "0:03:46"}
{"current_steps": 600, "total_steps": 1000, "loss": 0.4125, "lr": 7.312881488436928e-06, "epoch": 1.2, "percentage": 60.0, "elapsed_time": "0:05:18", "remaining_time": "0:03:32"}
{"current_steps": 625, "total_steps": 1000, "loss": 0.4108, "lr": 6.542627927979772e-06, "epoch": 1.25, "percentage": 62.5, "elapsed_time": "0:05:30", "remaining_time": "0:03:18"}
{"current_steps": 650, "total_steps": 1000, "loss": 0.4112, "lr": 5.795028379858355e-06, "epoch": 1.3, "percentage": 65.0, "elapsed_time": "0:05:42", "remaining_time": "0:03:04"}
{"current_steps": 675, "total_steps": 1000, "loss": 0.413, "lr": 5.074981399690219e-06, "epoch": 1.35, "percentage": 67.5, "elapsed_time": "0:05:54", "remaining_time": "0:02:50"}
{"current_steps": 700, "total_steps": 1000, "loss": 0.4136, "lr": 4.3872050082238535e-06, "epoch": 1.4, "percentage": 70.0, "elapsed_time": "0:06:05", "remaining_time": "0:02:36"}
{"current_steps": 725, "total_steps": 1000, "loss": 0.4115, "lr": 3.736205777078381e-06, "epoch": 1.45, "percentage": 72.5, "elapsed_time": "0:06:17", "remaining_time": "0:02:23"}
{"current_steps": 750, "total_steps": 1000, "loss": 0.4125, "lr": 3.126249299978086e-06, "epoch": 1.5, "percentage": 75.0, "elapsed_time": "0:06:29", "remaining_time": "0:02:09"}
{"current_steps": 775, "total_steps": 1000, "loss": 0.4122, "lr": 2.5613322429654573e-06, "epoch": 1.55, "percentage": 77.5, "elapsed_time": "0:06:41", "remaining_time": "0:01:56"}
{"current_steps": 800, "total_steps": 1000, "loss": 0.412, "lr": 2.0451561567303378e-06, "epoch": 1.6, "percentage": 80.0, "elapsed_time": "0:06:53", "remaining_time": "0:01:43"}
{"current_steps": 825, "total_steps": 1000, "loss": 0.4123, "lr": 1.5811032226467304e-06, "epoch": 1.65, "percentage": 82.5, "elapsed_time": "0:07:05", "remaining_time": "0:01:30"}
{"current_steps": 850, "total_steps": 1000, "loss": 0.4106, "lr": 1.1722140914384162e-06, "epoch": 1.7, "percentage": 85.0, "elapsed_time": "0:07:17", "remaining_time": "0:01:17"}
{"current_steps": 875, "total_steps": 1000, "loss": 0.4118, "lr": 8.211679596828481e-07, "epoch": 1.75, "percentage": 87.5, "elapsed_time": "0:07:28", "remaining_time": "0:01:04"}
{"current_steps": 900, "total_steps": 1000, "loss": 0.4125, "lr": 5.30265014699628e-07, "epoch": 1.8, "percentage": 90.0, "elapsed_time": "0:07:40", "remaining_time": "0:00:51"}
{"current_steps": 925, "total_steps": 1000, "loss": 0.4115, "lr": 3.0141136285129825e-07, "epoch": 1.85, "percentage": 92.5, "elapsed_time": "0:07:52", "remaining_time": "0:00:38"}
{"current_steps": 950, "total_steps": 1000, "loss": 0.4122, "lr": 1.361065400119399e-07, "epoch": 1.9, "percentage": 95.0, "elapsed_time": "0:08:04", "remaining_time": "0:00:25"}
{"current_steps": 975, "total_steps": 1000, "loss": 0.4112, "lr": 3.543368603973529e-08, "epoch": 1.95, "percentage": 97.5, "elapsed_time": "0:08:16", "remaining_time": "0:00:12"}
{"current_steps": 1000, "total_steps": 1000, "loss": 0.4103, "lr": 5.244763404133046e-11, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:08:28", "remaining_time": "0:00:00"}
{"current_steps": 1000, "total_steps": 1000, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:09:13", "remaining_time": "0:00:00"}