Training in progress, epoch 5
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +29 -3
- pytorch_model.bin +1 -1
- runs/May01_10-03-26_b04f269e142e/events.out.tfevents.1682935412.b04f269e142e.1987.2 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 535707205
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0059e6dae5f33b5e8010668e556651f53091251119d4c2628aa3433d0b839efa
|
3 |
size 535707205
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267858605
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5405cb5b6ce21eb5c583d4207099b0ed90146c4bc9eedb041f788dbef65a324f
|
3 |
size 267858605
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14575
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:737b3f7378942c003b399c1debf88e00265db027e430af8039949bb4d1a2e421
|
3 |
size 14575
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9d9a9ff992b0fb831a129f7e4a4f8d53a6ea9bdde23aa729f8def96a545386e
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": 1.606531023979187,
|
3 |
"best_model_checkpoint": "distilbert_final_tweet_dataset_200_epoch/checkpoint-230",
|
4 |
-
"epoch":
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -36,11 +36,37 @@
|
|
36 |
"eval_samples_per_second": 450.123,
|
37 |
"eval_steps_per_second": 56.96,
|
38 |
"step": 345
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
39 |
}
|
40 |
],
|
41 |
"max_steps": 23000,
|
42 |
"num_train_epochs": 200,
|
43 |
-
"total_flos":
|
44 |
"trial_name": null,
|
45 |
"trial_params": null
|
46 |
}
|
|
|
1 |
{
|
2 |
"best_metric": 1.606531023979187,
|
3 |
"best_model_checkpoint": "distilbert_final_tweet_dataset_200_epoch/checkpoint-230",
|
4 |
+
"epoch": 5.0,
|
5 |
+
"global_step": 575,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
36 |
"eval_samples_per_second": 450.123,
|
37 |
"eval_steps_per_second": 56.96,
|
38 |
"step": 345
|
39 |
+
},
|
40 |
+
{
|
41 |
+
"epoch": 4.0,
|
42 |
+
"eval_accuracy": 0.6296296296296297,
|
43 |
+
"eval_f1": 0.6251138433515483,
|
44 |
+
"eval_loss": 2.2798941135406494,
|
45 |
+
"eval_runtime": 0.7194,
|
46 |
+
"eval_samples_per_second": 450.35,
|
47 |
+
"eval_steps_per_second": 56.989,
|
48 |
+
"step": 460
|
49 |
+
},
|
50 |
+
{
|
51 |
+
"epoch": 4.35,
|
52 |
+
"learning_rate": 4.891304347826087e-05,
|
53 |
+
"loss": 0.1025,
|
54 |
+
"step": 500
|
55 |
+
},
|
56 |
+
{
|
57 |
+
"epoch": 5.0,
|
58 |
+
"eval_accuracy": 0.6512345679012346,
|
59 |
+
"eval_f1": 0.6431049313635814,
|
60 |
+
"eval_loss": 2.6507568359375,
|
61 |
+
"eval_runtime": 0.7337,
|
62 |
+
"eval_samples_per_second": 441.574,
|
63 |
+
"eval_steps_per_second": 55.878,
|
64 |
+
"step": 575
|
65 |
}
|
66 |
],
|
67 |
"max_steps": 23000,
|
68 |
"num_train_epochs": 200,
|
69 |
+
"total_flos": 185563744734420.0,
|
70 |
"trial_name": null,
|
71 |
"trial_params": null
|
72 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 267858605
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5405cb5b6ce21eb5c583d4207099b0ed90146c4bc9eedb041f788dbef65a324f
|
3 |
size 267858605
|
runs/May01_10-03-26_b04f269e142e/events.out.tfevents.1682935412.b04f269e142e.1987.2
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be44413331b6fc6ffa6df0c9de4d6a0381db5fbdfe3aaca05fbc1cf9a8c46d2d
|
3 |
+
size 6165
|