{ "achieved_tflops_per_gpu": 0.007574653146635192, "achieved_tflops_per_gpu_theoretical": 1114.6206011688223, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.13213281333446503, "mfu_percent": 0.0005353111764406496, "mfu_percent_theoretical": 78.7717739341924, "total_flos": 1596873627009024.0, "train_loss": 0.09127889497572297, "train_runtime": 13176.1283, "train_samples_per_second": 5.26, "train_steps_per_second": 0.329, "valid_targets_mean": 5086.1, "valid_targets_min": 2015 }