{ "epoch": 0.9975786924939467, "total_flos": 7.598970652485222e+16, "train_loss": 1.8085910475369795, "train_runtime": 916.9479, "train_samples": 42336, "train_samples_per_second": 14.402, "train_steps_per_second": 0.225 }