{ "achieved_tflops_per_gpu": 3.194680814635091, "achieved_tflops_per_gpu_theoretical": 291.35979240279244, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.3030981719493866, "mfu_percent": 0.32302131593883626, "mfu_percent_theoretical": 29.4600396767232, "total_flos": 1.299011914721919e+18, "train_loss": 0.3405153105383391, "train_runtime": 50827.1401, "train_samples_per_second": 1.373, "train_steps_per_second": 0.086, "valid_targets_mean": 4862.5, "valid_targets_min": 1479 }