{ "achieved_tflops_per_gpu": 4.937536133249764, "achieved_tflops_per_gpu_theoretical": 226.98960570915227, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.08761073648929596, "mfu_percent": 0.4992453117542734, "mfu_percent_theoretical": 22.951426259772727, "total_flos": 2.474107676200534e+18, "train_loss": 0.24594933182050951, "train_runtime": 62635.179, "train_samples_per_second": 1.069, "train_steps_per_second": 0.067, "valid_targets_mean": 11621.8, "valid_targets_min": 3550 }