{ "epoch": 1.0, "eval_loss": 1.6678621768951416, "eval_runtime": 44.6818, "eval_samples_per_second": 78.981, "eval_steps_per_second": 9.892, "perplexity": 5.300823452549077, "total_flos": 2.016828552422359e+17, "train_loss": 3.3373708904914134, "train_runtime": 461.7028, "train_samples_per_second": 29.374, "train_steps_per_second": 3.673 }