{ "achieved_tflops_per_gpu": 0.00364986281178115, "achieved_tflops_per_gpu_theoretical": 626.7623441222861, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.14995810389518738, "mfu_percent": 0.0002579408347548516, "mfu_percent_theoretical": 44.29415859521456, "total_flos": 1254621303865344.0, "train_loss": 0.1876786600655953, "train_runtime": 21484.049, "train_samples_per_second": 2.956, "train_steps_per_second": 0.185, "valid_targets_mean": 5724.8, "valid_targets_min": 613 }