{ "achieved_tflops_per_gpu": 0.0023249012759657254, "achieved_tflops_per_gpu_theoretical": 514.9614935491215, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.23076336085796356, "mfu_percent": 0.00016430397710005126, "mfu_percent_theoretical": 36.39303841336548, "total_flos": 1056573424926720.0, "train_loss": 0.349568347366189, "train_runtime": 28403.7175, "train_samples_per_second": 2.431, "train_steps_per_second": 0.152, "valid_targets_mean": 5247.5, "valid_targets_min": 1276 }