{ "achieved_tflops_per_gpu": 0.0003518731812688662, "achieved_tflops_per_gpu_theoretical": 1439.8594391998463, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.3174639642238617, "mfu_percent": 2.4867362633842135e-05, "mfu_percent_theoretical": 101.75685082684426, "total_flos": 22338300149760.0, "train_loss": 0.652452801803053, "train_runtime": 3967.747, "train_samples_per_second": 6.796, "train_steps_per_second": 0.425, "valid_targets_mean": 94.8, "valid_targets_min": 62 }