{ "achieved_tflops_per_gpu": 3.754126430475683, "achieved_tflops_per_gpu_theoretical": 233.76541483479863, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.022832343354821205, "mfu_percent": 0.2653092883728398, "mfu_percent_theoretical": 16.520524016593544, "total_flos": 4.836413774367818e+18, "train_loss": 0.19618723029549, "train_runtime": 26839.4318, "train_samples_per_second": 6.577, "train_steps_per_second": 0.069, "valid_targets_mean": 5367.0, "valid_targets_min": 1264 }