{ "achieved_tflops_per_gpu": 4.8979905652577145, "achieved_tflops_per_gpu_theoretical": 274.4202695886766, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.1307346224784851, "mfu_percent": 0.4952467710068468, "mfu_percent_theoretical": 27.74724667226255, "total_flos": 2.2423052373794488e+18, "train_loss": 0.2677417782024403, "train_runtime": 57225.1316, "train_samples_per_second": 1.294, "train_steps_per_second": 0.081, "valid_targets_mean": 5411.9, "valid_targets_min": 3923 }