{ "achieved_tflops_per_gpu": 5.7291596130922695, "achieved_tflops_per_gpu_theoretical": 250.7049376489144, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.2848636209964752, "mfu_percent": 0.5792881307474489, "mfu_percent_theoretical": 25.349336466017636, "total_flos": 2.2384198545393582e+18, "train_loss": 0.3086844535421305, "train_runtime": 48838.3115, "train_samples_per_second": 1.177, "train_steps_per_second": 0.074, "valid_targets_mean": 4286.8, "valid_targets_min": 2135 }