dq158 commited on
Commit
b4f2d25
·
1 Parent(s): e04293a

Training in progress, epoch 5, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8b1f3b82e6184cf3fa1f97e3633ed652219d243ea18fef27a35a38877c4c498c
3
  size 2371770
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b97ff2c46e83b02c5dac9aef9f59c66bb654fc31cf4601ff87ff73224691566
3
  size 2371770
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:63200bebd3227b384c5ba52c132d7b8ab92410896734805be9e58058c777ae71
3
  size 990409330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:538c6afe3af4e0e1ffd7998f1e019f18fbd60f4e2b15c398e1ec3b1435f65d6e
3
  size 990409330
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce000429344a01e02536fd43d4c586bca70568f5e5b5ee181c3030c0d0aae5bd
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b54ac781bcf42bd5774e68cd27f8b47ba97a92bc3e5e5b5762ae0f9660c2d4e6
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:845ca0614dd5d49345c95c404b37a30ec6d95611e0a635ec0ac26e0a4196186d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b57d4c861df932544616bc97fdff1b5095cad53562dd214e165dfc55a56cc480
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 2.257721424102783,
3
- "best_model_checkpoint": "dq158/pingusPongus/checkpoint-6324",
4
- "epoch": 4.0,
5
  "eval_steps": 500,
6
- "global_step": 6324,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -155,13 +155,50 @@
155
  "eval_steps_per_second": 0.607,
156
  "eval_translation_length": 53121,
157
  "step": 6324
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
158
  }
159
  ],
160
  "logging_steps": 500,
161
  "max_steps": 31620,
162
  "num_train_epochs": 20,
163
  "save_steps": 500,
164
- "total_flos": 6.927279280304947e+16,
165
  "trial_name": null,
166
  "trial_params": null
167
  }
 
1
  {
2
+ "best_metric": 2.240872383117676,
3
+ "best_model_checkpoint": "dq158/pingusPongus/checkpoint-7905",
4
+ "epoch": 5.0,
5
  "eval_steps": 500,
6
+ "global_step": 7905,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
155
  "eval_steps_per_second": 0.607,
156
  "eval_translation_length": 53121,
157
  "step": 6324
158
+ },
159
+ {
160
+ "epoch": 4.11,
161
+ "learning_rate": 9.110503086981956e-05,
162
+ "loss": 2.2444,
163
+ "step": 6500
164
+ },
165
+ {
166
+ "epoch": 4.43,
167
+ "learning_rate": 8.961639836966304e-05,
168
+ "loss": 2.2152,
169
+ "step": 7000
170
+ },
171
+ {
172
+ "epoch": 4.74,
173
+ "learning_rate": 8.802685374286608e-05,
174
+ "loss": 2.2,
175
+ "step": 7500
176
+ },
177
+ {
178
+ "epoch": 5.0,
179
+ "eval_bleu": 1.0,
180
+ "eval_brevity_penalty": 1.0,
181
+ "eval_length_ratio": 1.0,
182
+ "eval_loss": 2.240872383117676,
183
+ "eval_precisions": [
184
+ 1.0,
185
+ 1.0,
186
+ 1.0,
187
+ 1.0
188
+ ],
189
+ "eval_reference_length": 52857,
190
+ "eval_runtime": 579.7989,
191
+ "eval_samples_per_second": 4.848,
192
+ "eval_steps_per_second": 0.607,
193
+ "eval_translation_length": 52857,
194
+ "step": 7905
195
  }
196
  ],
197
  "logging_steps": 500,
198
  "max_steps": 31620,
199
  "num_train_epochs": 20,
200
  "save_steps": 500,
201
+ "total_flos": 8.659099100381184e+16,
202
  "trial_name": null,
203
  "trial_params": null
204
  }