{ "achieved_tflops_per_gpu": 51242.27907434514, "achieved_tflops_per_gpu_theoretical": 1501156.7964550059, "epoch": 5.0, "mfu_percent": 3621.3624787523067, "mfu_percent_theoretical": 106088.81953745625, "total_flos": 3.756182037619278e+18, "train_loss": 0.0, "train_runtime": 2.2907, "train_samples_per_second": 42523.793, "train_steps_per_second": 443.093 }