{ "achieved_tflops_per_gpu": 0.00438470084781371, "achieved_tflops_per_gpu_theoretical": 640.3139623735788, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.1386960744857788, "mfu_percent": 0.0003098728514355979, "mfu_percent_theoretical": 45.25187013240839, "total_flos": 1630450968166400.0, "train_loss": 0.1932186623672386, "train_runtime": 23240.6244, "train_samples_per_second": 3.017, "train_steps_per_second": 0.189, "valid_targets_mean": 4301.4, "valid_targets_min": 221 }