{ "achieved_tflops_per_gpu": 0.005586118843879391, "achieved_tflops_per_gpu_theoretical": 745.339003821097, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.23579511046409607, "mfu_percent": 0.00039477871688193574, "mfu_percent_theoretical": 52.674134545660564, "total_flos": 1774371357458432.0, "train_loss": 0.271993322290693, "train_runtime": 19852.4616, "train_samples_per_second": 3.526, "train_steps_per_second": 0.22, "valid_targets_mean": 5026.7, "valid_targets_min": 4563 }