{ "achieved_tflops_per_gpu": 3.1038048161400233, "achieved_tflops_per_gpu_theoretical": 271.03236502585344, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.054979901760816574, "mfu_percent": 0.2193501636848073, "mfu_percent_theoretical": 19.154230743876568, "total_flos": 9.529203217976525e+16, "train_loss": 0.15973503326440786, "train_runtime": 959.4276, "train_samples_per_second": 7.296, "train_steps_per_second": 0.08, "valid_targets_mean": 4215.4, "valid_targets_min": 1870 }