player1537
commited on
Commit
•
929ef79
1
Parent(s):
168739b
Training in progress, step 22044
Browse files- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/pytorch_model.bin +1 -1
- last-checkpoint/rng_state.pth +1 -1
- last-checkpoint/scaler.pt +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +9 -3
- pytorch_model.bin +1 -1
- runs/Jun04_02-06-39_4367d7224c9f/events.out.tfevents.1685845095.4367d7224c9f.857.0 +2 -2
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6319689
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6647666f8d0fc534fb821dd4acb02c87203056a403f51823e927844a0fe8eb6
|
3 |
size 6319689
|
last-checkpoint/pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1121737121
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99997d8d83512acef3c4cbe1f65bcc63e923da9128d44d4f31a77fc2d2d0fa3e
|
3 |
size 1121737121
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14639
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b40c32b050066f0ed60185a04c440be4166655dfc5ba26d3739f1f40fb60f3fe
|
3 |
size 14639
|
last-checkpoint/scaler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 557
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd56176e725920af6b7720880038e0e973fdda3a8cf9ee899ad7b77393e85f3c
|
3 |
size 557
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 627
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5013dfcc679faef36ba1118629b5c9fa5b4e10806795066518618de7710eeb5d
|
3 |
size 627
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 0.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -144,11 +144,17 @@
|
|
144 |
"learning_rate": 1.514002245916253e-05,
|
145 |
"loss": 1.5341,
|
146 |
"step": 21000
|
|
|
|
|
|
|
|
|
|
|
|
|
147 |
}
|
148 |
],
|
149 |
"max_steps": 86379,
|
150 |
"num_train_epochs": 1,
|
151 |
-
"total_flos":
|
152 |
"trial_name": null,
|
153 |
"trial_params": null
|
154 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 0.25520091688952173,
|
5 |
+
"global_step": 22044,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
144 |
"learning_rate": 1.514002245916253e-05,
|
145 |
"loss": 1.5341,
|
146 |
"step": 21000
|
147 |
+
},
|
148 |
+
{
|
149 |
+
"epoch": 0.25,
|
150 |
+
"learning_rate": 1.4908484701142641e-05,
|
151 |
+
"loss": 1.519,
|
152 |
+
"step": 22000
|
153 |
}
|
154 |
],
|
155 |
"max_steps": 86379,
|
156 |
"num_train_epochs": 1,
|
157 |
+
"total_flos": 4.105134663951974e+16,
|
158 |
"trial_name": null,
|
159 |
"trial_params": null
|
160 |
}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1121737121
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99997d8d83512acef3c4cbe1f65bcc63e923da9128d44d4f31a77fc2d2d0fa3e
|
3 |
size 1121737121
|
runs/Jun04_02-06-39_4367d7224c9f/events.out.tfevents.1685845095.4367d7224c9f.857.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2af989065380892987dbfe17502796c97f4a74c8352c4ff71406a22cd9fcc7b8
|
3 |
+
size 6248
|