{ "achieved_tflops_per_gpu": 0.003765764673554456, "achieved_tflops_per_gpu_theoretical": 531.9010163632374, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.20184344053268433, "mfu_percent": 0.0002661317790497849, "mfu_percent_theoretical": 37.59017783485777, "total_flos": 1656860604825600.0, "train_loss": 0.3245428150801321, "train_runtime": 27498.7411, "train_samples_per_second": 2.513, "train_steps_per_second": 0.157, "valid_targets_mean": 6528.7, "valid_targets_min": 1969 }