{ "achieved_tflops_per_gpu": 0.003795708713251058, "achieved_tflops_per_gpu_theoretical": 616.5986304338165, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.16770605742931366, "mfu_percent": 0.0002682479656007815, "mfu_percent_theoretical": 43.57587494231919, "total_flos": 1289437200777216.0, "train_loss": 0.300232849066697, "train_runtime": 21231.8255, "train_samples_per_second": 2.904, "train_steps_per_second": 0.182, "valid_targets_mean": 4371.8, "valid_targets_min": 996 }