bayartsogt committed on
Commit
c6e7f07
1 Parent(s): 3f32fd0

Saving weights and logs of epoch 1

Browse files
events.out.tfevents.1625632941.t1v-n-ca847b55-w-0.49210.3.v2 → events.out.tfevents.1625674769.t1v-n-ca847b55-w-0.91545.3.v2 RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b17c320d2f2ccace9c38fd88a3ef4a114df53aefd4904e36549a3eec77c43721
3
- size 9234766
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:837c365d9c67da98fc50d9acda6076378c1a0eb71eb281fcfb76b93d3ba93642
3
+ size 219942
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8aa0221d54f09a9b23b964b520583bc0baa5fdfc555f1b6310ec01c693bd38d1
3
  size 1421662309
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a97adc24bbd87f0e7925f9743b0cfe15275a652d8e8b11d1c842e814c81063da
3
  size 1421662309
train_mlm.sh CHANGED
@@ -9,7 +9,7 @@
9
  --weight_decay="0.01" \
10
  --per_device_train_batch_size="64" \
11
  --per_device_eval_batch_size="64" \
12
- --learning_rate="3e-4" \
13
  --warmup_steps="1000" \
14
  --overwrite_output_dir \
15
  --pad_to_max_length \
 
9
  --weight_decay="0.01" \
10
  --per_device_train_batch_size="64" \
11
  --per_device_eval_batch_size="64" \
12
+ --learning_rate="5e-5" \
13
  --warmup_steps="1000" \
14
  --overwrite_output_dir \
15
  --pad_to_max_length \