{ "achieved_tflops_per_gpu": 0.0028551198494507035, "achieved_tflops_per_gpu_theoretical": 643.7018669364019, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.16112969815731049, "mfu_percent": 0.00020177525437814158, "mfu_percent_theoretical": 45.49129801670684, "total_flos": 1028685735067648.0, "train_loss": 0.2310619655023648, "train_runtime": 22518.4447, "train_samples_per_second": 3.037, "train_steps_per_second": 0.19, "valid_targets_mean": 4178.8, "valid_targets_min": 1139 }