{ "achieved_tflops_per_gpu": 839.4888333380325, "achieved_tflops_per_gpu_theoretical": 251879765.55876052, "epoch": 6.18641975308642, "mfu_percent": 59.32783274473727, "mfu_percent_theoretical": 17800690.145495445, "total_flos": 3.2973778191384576e+16, "train_loss": 0.0, "train_runtime": 0.8183, "train_samples_per_second": 13858.168, "train_steps_per_second": 6929.084 }