28 lines
6.1 KiB
JSON
28 lines
6.1 KiB
JSON
{"current_steps": 1, "total_steps": 25, "loss": 0.2265, "lr": 0.0, "epoch": 0.21052631578947367, "percentage": 4.0, "elapsed_time": "0:00:20", "remaining_time": "0:08:19", "throughput": 4356.76, "total_tokens": 90632}
|
|
{"current_steps": 2, "total_steps": 25, "loss": 0.2547, "lr": 1.6666666666666667e-05, "epoch": 0.42105263157894735, "percentage": 8.0, "elapsed_time": "0:00:30", "remaining_time": "0:05:50", "throughput": 6026.62, "total_tokens": 183712}
|
|
{"current_steps": 3, "total_steps": 25, "loss": 0.2468, "lr": 3.3333333333333335e-05, "epoch": 0.631578947368421, "percentage": 12.0, "elapsed_time": "0:00:40", "remaining_time": "0:04:55", "throughput": 6895.2, "total_tokens": 277384}
|
|
{"current_steps": 4, "total_steps": 25, "loss": 0.238, "lr": 5e-05, "epoch": 0.8421052631578947, "percentage": 16.0, "elapsed_time": "0:00:50", "remaining_time": "0:04:24", "throughput": 7483.92, "total_tokens": 376672}
|
|
{"current_steps": 5, "total_steps": 25, "loss": 0.2939, "lr": 4.9745536047023324e-05, "epoch": 1.0, "percentage": 20.0, "elapsed_time": "0:00:55", "remaining_time": "0:03:40", "throughput": 8137.68, "total_tokens": 448584}
|
|
{"current_steps": 6, "total_steps": 25, "loss": 0.3134, "lr": 4.898732434036244e-05, "epoch": 1.2105263157894737, "percentage": 24.0, "elapsed_time": "0:01:04", "remaining_time": "0:03:25", "throughput": 8345.8, "total_tokens": 541576}
|
|
{"current_steps": 7, "total_steps": 25, "loss": 0.2642, "lr": 4.774079988386296e-05, "epoch": 1.4210526315789473, "percentage": 28.0, "elapsed_time": "0:01:14", "remaining_time": "0:03:12", "throughput": 8536.64, "total_tokens": 637744}
|
|
{"current_steps": 8, "total_steps": 25, "loss": 0.2666, "lr": 4.6031338320779534e-05, "epoch": 1.631578947368421, "percentage": 32.0, "elapsed_time": "0:01:24", "remaining_time": "0:03:00", "throughput": 8627.7, "total_tokens": 732120}
|
|
{"current_steps": 9, "total_steps": 25, "loss": 0.2346, "lr": 4.389373935885646e-05, "epoch": 1.8421052631578947, "percentage": 36.0, "elapsed_time": "0:01:35", "remaining_time": "0:02:48", "throughput": 8768.67, "total_tokens": 833528}
|
|
{"current_steps": 10, "total_steps": 25, "loss": 0.251, "lr": 4.137151834863213e-05, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "0:01:43", "remaining_time": "0:02:34", "throughput": 8696.01, "total_tokens": 897168}
|
|
{"current_steps": 11, "total_steps": 25, "loss": 0.2168, "lr": 3.851602043638994e-05, "epoch": 2.2105263157894735, "percentage": 44.0, "elapsed_time": "0:01:52", "remaining_time": "0:02:23", "throughput": 8826.85, "total_tokens": 993464}
|
|
{"current_steps": 12, "total_steps": 25, "loss": 0.1636, "lr": 3.5385375325047166e-05, "epoch": 2.4210526315789473, "percentage": 48.0, "elapsed_time": "0:02:02", "remaining_time": "0:02:12", "throughput": 8935.83, "total_tokens": 1092872}
|
|
{"current_steps": 13, "total_steps": 25, "loss": 0.1882, "lr": 3.2043313921035743e-05, "epoch": 2.6315789473684212, "percentage": 52.0, "elapsed_time": "0:02:12", "remaining_time": "0:02:02", "throughput": 8984.4, "total_tokens": 1188144}
|
|
{"current_steps": 14, "total_steps": 25, "loss": 0.161, "lr": 2.8557870956832132e-05, "epoch": 2.8421052631578947, "percentage": 56.0, "elapsed_time": "0:02:22", "remaining_time": "0:01:51", "throughput": 9062.46, "total_tokens": 1287152}
|
|
{"current_steps": 15, "total_steps": 25, "loss": 0.2328, "lr": 2.5e-05, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "0:02:29", "remaining_time": "0:01:39", "throughput": 8985.51, "total_tokens": 1345752}
|
|
{"current_steps": 16, "total_steps": 25, "loss": 0.1513, "lr": 2.1442129043167874e-05, "epoch": 3.2105263157894735, "percentage": 64.0, "elapsed_time": "0:02:39", "remaining_time": "0:01:29", "throughput": 9008.43, "total_tokens": 1438888}
|
|
{"current_steps": 17, "total_steps": 25, "loss": 0.1159, "lr": 1.795668607896426e-05, "epoch": 3.4210526315789473, "percentage": 68.0, "elapsed_time": "0:02:49", "remaining_time": "0:01:19", "throughput": 9062.9, "total_tokens": 1535160}
|
|
{"current_steps": 18, "total_steps": 25, "loss": 0.1408, "lr": 1.4614624674952842e-05, "epoch": 3.6315789473684212, "percentage": 72.0, "elapsed_time": "0:02:59", "remaining_time": "0:01:09", "throughput": 9097.47, "total_tokens": 1629952}
|
|
{"current_steps": 19, "total_steps": 25, "loss": 0.1207, "lr": 1.148397956361007e-05, "epoch": 3.8421052631578947, "percentage": 76.0, "elapsed_time": "0:03:08", "remaining_time": "0:00:59", "throughput": 9149.6, "total_tokens": 1729264}
|
|
{"current_steps": 20, "total_steps": 25, "loss": 0.1767, "lr": 8.628481651367876e-06, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "0:03:16", "remaining_time": "0:00:49", "throughput": 9117.89, "total_tokens": 1794336}
|
|
{"current_steps": 21, "total_steps": 25, "loss": 0.0917, "lr": 6.106260641143546e-06, "epoch": 4.2105263157894735, "percentage": 84.0, "elapsed_time": "0:03:26", "remaining_time": "0:00:39", "throughput": 9170.0, "total_tokens": 1893760}
|
|
{"current_steps": 22, "total_steps": 25, "loss": 0.1139, "lr": 3.968661679220468e-06, "epoch": 4.421052631578947, "percentage": 88.0, "elapsed_time": "0:03:35", "remaining_time": "0:00:29", "throughput": 9184.22, "total_tokens": 1981256}
|
|
{"current_steps": 23, "total_steps": 25, "loss": 0.1306, "lr": 2.2592001161370392e-06, "epoch": 4.631578947368421, "percentage": 92.0, "elapsed_time": "0:03:45", "remaining_time": "0:00:19", "throughput": 9212.38, "total_tokens": 2077800}
|
|
{"current_steps": 24, "total_steps": 25, "loss": 0.133, "lr": 1.0126756596375686e-06, "epoch": 4.842105263157895, "percentage": 96.0, "elapsed_time": "0:03:55", "remaining_time": "0:00:09", "throughput": 9229.22, "total_tokens": 2170328}
|
|
{"current_steps": 25, "total_steps": 25, "loss": 0.1053, "lr": 2.544639529766829e-07, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:03:59", "remaining_time": "0:00:00", "throughput": 9362.79, "total_tokens": 2242920}
|
|
{"current_steps": 25, "total_steps": 25, "eval_loss": 0.16564106941223145, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:04:00", "remaining_time": "0:00:00", "throughput": 9339.71, "total_tokens": 2242920}
|
|
{"current_steps": 25, "total_steps": 25, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:05:53", "remaining_time": "0:00:00", "throughput": 6341.17, "total_tokens": 2242920}
|