{ "achieved_tflops_per_gpu": 97.75913810098812, "achieved_tflops_per_gpu_theoretical": 1419.5320118229072, "epoch": 5.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.018921401351690292, "mfu_percent": 6.908773010670539, "mfu_percent_theoretical": 100.3202835210535, "total_flos": 3.8872733453226344e+19, "train_loss": 0.0035894543761941615, "train_runtime": 12426.1828, "train_samples_per_second": 40.238, "train_steps_per_second": 0.419, "valid_targets_mean": 8871.3, "valid_targets_min": 2185 }