{ "achieved_tflops_per_gpu": 0.002376715033316625, "achieved_tflops_per_gpu_theoretical": 403.160642975957, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.3035658001899719, "mfu_percent": 0.00016796572673615724, "mfu_percent_theoretical": 28.491918231516397, "total_flos": 1381541515886592.0, "train_loss": 0.3652997003221998, "train_runtime": 36330.121, "train_samples_per_second": 1.899, "train_steps_per_second": 0.119, "valid_targets_mean": 8644.1, "valid_targets_min": 705 }