{ "achieved_tflops_per_gpu": 3.2314190492736135, "achieved_tflops_per_gpu_theoretical": 315.0751243425546, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.27547487616539, "mfu_percent": 0.3267360009376758, "mfu_percent_theoretical": 31.857949882968107, "total_flos": 1.228481933579649e+18, "train_loss": 0.32828609189208674, "train_runtime": 47520.9929, "train_samples_per_second": 1.483, "train_steps_per_second": 0.093, "valid_targets_mean": 5897.4, "valid_targets_min": 1500 }