{ "achieved_tflops_per_gpu": 5.311919514959495, "achieved_tflops_per_gpu_theoretical": 223.6017011463291, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.21145598590373993, "mfu_percent": 0.5371000520687053, "mfu_percent_theoretical": 22.608867658880598, "total_flos": 2.8947179058078024e+18, "train_loss": 0.26257057309707904, "train_runtime": 68118.4527, "train_samples_per_second": 1.048, "train_steps_per_second": 0.066, "valid_targets_mean": 4636.9, "valid_targets_min": 581 }