Saving weights and log at step 940000
Browse files
- README.md +1 -1
- flax_model.msgpack +1 -1
- opt_state.msgpack +1 -1
- pytorch_model.bin +1 -1
- runs/events.out.tfevents.1641156371.t1v-n-2f64d7c8-w-0.13342.0.v2 +2 -2
- training_state.json +1 -1
README.md
CHANGED
@@ -30,7 +30,7 @@ Tokenizer:
|
|
30 |
Training details:
|
31 |
|
32 |
* Trained for 70K steps (batch size 64) to ppl 27 on mc4 nl tiny 1 epoch
|
33 |
-
* Trained for
|
34 |
* Training continuing
|
35 |
* Block size: 512
|
36 |
* Optimizer: adafactor
|
|
|
30 |
Training details:
|
31 |
|
32 |
* Trained for 70K steps (batch size 64) to ppl 27 on mc4 nl tiny 1 epoch
|
33 |
+
* Trained for 940K steps (batch size 16) to ppl 16.1 on mc4 nl full
|
34 |
* Training continuing
|
35 |
* Block size: 512
|
36 |
* Optimizer: adafactor
|
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5262314590
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fc6108ceb04b0eb260bb51e05c838bfe34edb9dae95beb56b8ee0188fb40d74
|
3 |
size 5262314590
|
opt_state.msgpack
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5778100
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78016f9de2503a950519f04f279d254035f8fb347e507eb2c8745626f07d9340
|
3 |
size 5778100
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5363100545
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:142e35c1e7519d17d1f81c70452f6395dae97c9f47078469a81f398744893181
|
3 |
size 5363100545
|
runs/events.out.tfevents.1641156371.t1v-n-2f64d7c8-w-0.13342.0.v2
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3cb59e175ed446f3a057a221aaab3eed4ab0a69effd75db86b78e074d3b7062
|
3 |
+
size 141080779
|
training_state.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"step":
|
|
|
1 |
+
{"step": 940001}
|