End of training
Browse files- all_results.json +6 -6
- eval_results.json +3 -3
- train_results.json +3 -3
- trainer_state.json +3 -3
all_results.json
CHANGED
@@ -1,11 +1,11 @@
|
|
1 |
{
|
2 |
"epoch": 0.04,
|
3 |
"eval_loss": 0.07713703066110611,
|
4 |
-
"eval_runtime":
|
5 |
-
"eval_samples_per_second":
|
6 |
-
"eval_steps_per_second":
|
7 |
"train_loss": 0.0033295607640092873,
|
8 |
-
"train_runtime":
|
9 |
-
"train_samples_per_second":
|
10 |
-
"train_steps_per_second":
|
11 |
}
|
|
|
1 |
{
|
2 |
"epoch": 0.04,
|
3 |
"eval_loss": 0.07713703066110611,
|
4 |
+
"eval_runtime": 761.1334,
|
5 |
+
"eval_samples_per_second": 50.911,
|
6 |
+
"eval_steps_per_second": 6.364,
|
7 |
"train_loss": 0.0033295607640092873,
|
8 |
+
"train_runtime": 303.4327,
|
9 |
+
"train_samples_per_second": 386.099,
|
10 |
+
"train_steps_per_second": 48.264
|
11 |
}
|
eval_results.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"epoch": 0.04,
|
3 |
"eval_loss": 0.07713703066110611,
|
4 |
-
"eval_runtime":
|
5 |
-
"eval_samples_per_second":
|
6 |
-
"eval_steps_per_second":
|
7 |
}
|
|
|
1 |
{
|
2 |
"epoch": 0.04,
|
3 |
"eval_loss": 0.07713703066110611,
|
4 |
+
"eval_runtime": 761.1334,
|
5 |
+
"eval_samples_per_second": 50.911,
|
6 |
+
"eval_steps_per_second": 6.364
|
7 |
}
|
train_results.json
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
{
|
2 |
"epoch": 0.04,
|
3 |
"train_loss": 0.0033295607640092873,
|
4 |
-
"train_runtime":
|
5 |
-
"train_samples_per_second":
|
6 |
-
"train_steps_per_second":
|
7 |
}
|
|
|
1 |
{
|
2 |
"epoch": 0.04,
|
3 |
"train_loss": 0.0033295607640092873,
|
4 |
+
"train_runtime": 303.4327,
|
5 |
+
"train_samples_per_second": 386.099,
|
6 |
+
"train_steps_per_second": 48.264
|
7 |
}
|
trainer_state.json
CHANGED
@@ -208,9 +208,9 @@
|
|
208 |
"step": 14645,
|
209 |
"total_flos": 7.904602466056929e+18,
|
210 |
"train_loss": 0.0033295607640092873,
|
211 |
-
"train_runtime":
|
212 |
-
"train_samples_per_second":
|
213 |
-
"train_steps_per_second":
|
214 |
}
|
215 |
],
|
216 |
"max_steps": 14645,
|
|
|
208 |
"step": 14645,
|
209 |
"total_flos": 7.904602466056929e+18,
|
210 |
"train_loss": 0.0033295607640092873,
|
211 |
+
"train_runtime": 303.4327,
|
212 |
+
"train_samples_per_second": 386.099,
|
213 |
+
"train_steps_per_second": 48.264
|
214 |
}
|
215 |
],
|
216 |
"max_steps": 14645,
|