{ "achieved_tflops_per_gpu": 0.0031050564450395435, "achieved_tflops_per_gpu_theoretical": 501.4098752978288, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.23596960306167603, "mfu_percent": 0.00021943861802399602, "mfu_percent_theoretical": 35.43532687617165, "total_flos": 1290449162534912.0, "train_loss": 0.2838498419017905, "train_runtime": 25974.7525, "train_samples_per_second": 2.373, "train_steps_per_second": 0.148, "valid_targets_mean": 3951.1, "valid_targets_min": 1262 }