{ "epoch": 0.998003992015968, "total_flos": 8.741444925364634e+16, "train_loss": 1.2971151485443115, "train_runtime": 891.5874, "train_samples": 42336, "train_samples_per_second": 17.966, "train_steps_per_second": 0.28 }