{ "epoch": 92.0, "learning_rate": 1.0000000000000002e-06, "total_flos": 1.1890234809282512e+21, "train_loss": 0.1360613288991788, "train_runtime": 194834.2342, "train_samples_per_second": 6.71, "train_steps_per_second": 0.21 }