Training in progress, epoch 29
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +23 -3
- pytorch_model.bin +1 -1
- runs/May01_10-03-26_b04f269e142e/events.out.tfevents.1682935412.b04f269e142e.1987.2 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 535707205
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:408026f6a6387da59bc103ec5c9bf59663bfa4ac88f11705546f5292730bb56c
|
3 |
size 535707205
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267858605
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61843b369fadbf2a6a9e2852c7b3eb1a79dd2647f244cc7c1f5923b451d0cddb
|
3 |
size 267858605
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1781283e2d2196fb143e1e7f022e45333891363a4afbce2de165d310586248ac
|
3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b08bd8b313e48a9bc73431af12c3c84b3dfb983234faac375a28f9023989c4f0
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": 1.606531023979187,
|
3 |
"best_model_checkpoint": "distilbert_final_tweet_dataset_200_epoch/checkpoint-230",
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -312,11 +312,31 @@
|
|
312 |
"eval_samples_per_second": 434.183,
|
313 |
"eval_steps_per_second": 54.943,
|
314 |
"step": 3105
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
315 |
}
|
316 |
],
|
317 |
"max_steps": 23000,
|
318 |
"num_train_epochs": 200,
|
319 |
-
"total_flos":
|
320 |
"trial_name": null,
|
321 |
"trial_params": null
|
322 |
}
|
|
|
1 |
{
|
2 |
"best_metric": 1.606531023979187,
|
3 |
"best_model_checkpoint": "distilbert_final_tweet_dataset_200_epoch/checkpoint-230",
|
4 |
+
"epoch": 29.0,
|
5 |
+
"global_step": 3335,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
312 |
"eval_samples_per_second": 434.183,
|
313 |
"eval_steps_per_second": 54.943,
|
314 |
"step": 3105
|
315 |
+
},
|
316 |
+
{
|
317 |
+
"epoch": 28.0,
|
318 |
+
"eval_accuracy": 0.6512345679012346,
|
319 |
+
"eval_f1": 0.646016361656172,
|
320 |
+
"eval_loss": 2.600759267807007,
|
321 |
+
"eval_runtime": 0.754,
|
322 |
+
"eval_samples_per_second": 429.696,
|
323 |
+
"eval_steps_per_second": 54.375,
|
324 |
+
"step": 3220
|
325 |
+
},
|
326 |
+
{
|
327 |
+
"epoch": 29.0,
|
328 |
+
"eval_accuracy": 0.6759259259259259,
|
329 |
+
"eval_f1": 0.6760610574156681,
|
330 |
+
"eval_loss": 2.3673853874206543,
|
331 |
+
"eval_runtime": 0.7318,
|
332 |
+
"eval_samples_per_second": 442.773,
|
333 |
+
"eval_steps_per_second": 56.03,
|
334 |
+
"step": 3335
|
335 |
}
|
336 |
],
|
337 |
"max_steps": 23000,
|
338 |
"num_train_epochs": 200,
|
339 |
+
"total_flos": 1076269719459636.0,
|
340 |
"trial_name": null,
|
341 |
"trial_params": null
|
342 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267858605
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61843b369fadbf2a6a9e2852c7b3eb1a79dd2647f244cc7c1f5923b451d0cddb
|
3 |
size 267858605
|
runs/May01_10-03-26_b04f269e142e/events.out.tfevents.1682935412.b04f269e142e.1987.2
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ebe6a7096c66aaaddb45d91019405033609cc8fc1ed7bb7c1ade99f30192a33e
|
3 |
+
size 15806
|