{ "achieved_tflops_per_gpu": 0.002924690961750274, "achieved_tflops_per_gpu_theoretical": 538.6768254888838, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.25932279229164124, "mfu_percent": 0.00020669194075973666, "mfu_percent_theoretical": 38.069033603454685, "total_flos": 1114110277320704.0, "train_loss": 0.27588593444180864, "train_runtime": 23808.2906, "train_samples_per_second": 2.54, "train_steps_per_second": 0.159, "valid_targets_mean": 5070.4, "valid_targets_min": 1372 }