{ "achieved_tflops_per_gpu": 14260.634490252658, "achieved_tflops_per_gpu_theoretical": 285996.7394798434, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.11673309653997421, "mfu_percent": 1007.8186918906473, "mfu_percent_theoretical": 20211.783708822855, "total_flos": 3.783973798181601e+17, "train_loss": 0.0, "train_runtime": 0.8292, "train_samples_per_second": 8061.816, "train_steps_per_second": 84.417, "valid_targets_mean": 6721.8, "valid_targets_min": 2351 }