{ "epoch": 100.0, "eval_loss": 0.036083951592445374, "eval_runtime": 0.5261, "eval_samples_per_second": 115.958, "eval_steps_per_second": 7.604, "total_flos": 4353076050246000.0, "train_loss": 0.7646091413497925, "train_runtime": 498.9098, "train_samples_per_second": 48.506, "train_steps_per_second": 1.603 }