{ "achieved_tflops_per_gpu": 0.003694895775092794, "achieved_tflops_per_gpu_theoretical": 738.5631946954506, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.1528853178024292, "mfu_percent": 0.0002611233763316462, "mfu_percent_theoretical": 52.19527877706365, "total_flos": 1136028581756928.0, "train_loss": 0.1835220243889308, "train_runtime": 19216.1811, "train_samples_per_second": 3.487, "train_steps_per_second": 0.218, "valid_targets_mean": 3614.8, "valid_targets_min": 1526 }