{ | |
"epoch": 0.010905601116733554, | |
"eval_accuracy": 0.7869404549281535, | |
"eval_loss": 0.8759388327598572, | |
"eval_runtime": 249.4157, | |
"eval_samples": 5564, | |
"eval_samples_per_second": 22.308, | |
"eval_steps_per_second": 0.088, | |
"perplexity": 2.4011284942034856, | |
"total_flos": 1.3069163715939533e+18, | |
"train_loss": 1.3858390502929687, | |
"train_runtime": 13072.5982, | |
"train_samples": 5868487, | |
"train_samples_per_second": 1346.745, | |
"train_steps_per_second": 21.043 | |
} |