{ "epoch": 2.0, "total_flos": 957358891008.0, "train_loss": 0.20337393274982868, "train_runtime": 258.6726, "train_samples_per_second": 12.688, "train_steps_per_second": 1.593 }