{ "achieved_tflops_per_gpu": 0.0030214454931977936, "achieved_tflops_per_gpu_theoretical": 498.0219707350057, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.11442745476961136, "mfu_percent": 0.00021352971683376632, "mfu_percent_theoretical": 35.1958989918732, "total_flos": 1222766426718208.0, "train_loss": 0.19705863873869428, "train_runtime": 25293.4901, "train_samples_per_second": 2.35, "train_steps_per_second": 0.147, "valid_targets_mean": 7264.7, "valid_targets_min": 669 }