{ "achieved_tflops_per_gpu": 134266.39948678762, "achieved_tflops_per_gpu_theoretical": 3485791.289356818, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.4433520436286926, "mfu_percent": 9488.791483165203, "mfu_percent_theoretical": 246345.67415949245, "total_flos": 5.319956987025293e+18, "train_loss": 0.0, "train_runtime": 1.2382, "train_samples_per_second": 98264.932, "train_steps_per_second": 1028.893, "valid_targets_mean": 9841.1, "valid_targets_min": 3598 }