{ "epoch": 3.0, "eval_loss": 1.6106535196304321, "eval_runtime": 8.342, "eval_samples_per_second": 45.672, "eval_steps_per_second": 11.508, "perplexity": 5.006081731731173, "total_flos": 1.0283028491985224e+19, "train_loss": 1.6124080855326697, "train_runtime": 7405.1369, "train_samples_per_second": 15.277, "train_steps_per_second": 0.478 }