{
    "epoch": 3.0,
    "eval_accuracy": 0.6942843185148998,
    "eval_loss": 1.6576473712921143,
    "eval_runtime": 2.7252,
    "eval_samples": 10,
    "eval_samples_per_second": 3.669,
    "eval_steps_per_second": 0.367,
    "perplexity": 5.246952182142712,
    "total_flos": 1601895923712000.0,
    "train_loss": 1.7650197347005208,
    "train_runtime": 162.5074,
    "train_samples": 1000,
    "train_samples_per_second": 18.461,
    "train_steps_per_second": 0.591
}