{ "achieved_tflops_per_gpu": 10416.903675332684, "achieved_tflops_per_gpu_theoretical": 300700.2452824959, "epoch": 7.0, "mfu_percent": 736.1769381860554, "mfu_percent_theoretical": 21250.900726678155, "total_flos": 2.891732460272353e+17, "train_loss": 0.0, "train_runtime": 0.8675, "train_samples_per_second": 8068.811, "train_steps_per_second": 88.757 }