{
  "epoch": 0.9999493031929397,
  "eval_loss": 1.1684964895248413,
  "eval_runtime": 428.841,
  "eval_samples": 14447,
  "eval_samples_per_second": 33.688,
  "eval_steps_per_second": 8.423,
  "perplexity": 3.2171519787488077,
  "total_flos": 5.643098158163558e+18,
  "train_loss": 1.2418534558435956,
  "train_runtime": 283616.7229,
  "train_samples": 2919315,
  "train_samples_per_second": 10.293,
  "train_steps_per_second": 0.04
}