{ "achieved_tflops_per_gpu": 51242.27907434514, "achieved_tflops_per_gpu_theoretical": 1501156.7964550059, "epoch": 5.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.0942406952381134, "mfu_percent": 3621.3624787523067, "mfu_percent_theoretical": 106088.81953745625, "total_flos": 3.756182037619278e+18, "train_loss": 0.0, "train_runtime": 2.2907, "train_samples_per_second": 42523.793, "train_steps_per_second": 443.093, "valid_targets_mean": 8724.4, "valid_targets_min": 2268 }