{ "achieved_tflops_per_gpu": 3.398471531074522, "achieved_tflops_per_gpu_theoretical": 352.34207453360943, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.15736517310142517, "mfu_percent": 0.3436270506647646, "mfu_percent_theoretical": 35.62609449278154, "total_flos": 1.1754390626437693e+18, "train_loss": 0.32822010551712344, "train_runtime": 43234.1073, "train_samples_per_second": 1.657, "train_steps_per_second": 0.104, "valid_targets_mean": 3889.8, "valid_targets_min": 1146 }