Files
g1_subagent_e1_gpt_long_tacc/train_results.json

16 lines
544 B
JSON
Raw Permalink Normal View History

{
"achieved_tflops_per_gpu": 0.003765764673554456,
"achieved_tflops_per_gpu_theoretical": 531.9010163632374,
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20184344053268433,
"mfu_percent": 0.0002661317790497849,
"mfu_percent_theoretical": 37.59017783485777,
"total_flos": 1656860604825600.0,
"train_loss": 0.3245428150801321,
"train_runtime": 27498.7411,
"train_samples_per_second": 2.513,
"train_steps_per_second": 0.157,
"valid_targets_mean": 6528.7,
"valid_targets_min": 1969
}