dq158 committed on
Commit
d7b0fa2
·
1 Parent(s): acb3305

Training in progress, epoch 10, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce9ee458806a62ae72a1e4d5a5acc18de5a23f594846dc936e964bf32d34ebae
3
  size 2371770
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a439bb31358d05c083aec181dc04c10dbb5fcc668174b9ab393917d19d7ebaa3
3
  size 2371770
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94598a1ea1df407591b98594fea9e8dcf2043b9124d78c0764a36b0a04886f57
3
  size 990409330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0363553bd2c0b6be1229b2249a2e03d68d4405453c01a0107dc6d001f6d736c9
3
  size 990409330
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b21196dd7454f3b651b63e42d3595da46748179b2ded600b1b8e0ecb74a09883
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37187fd0c8eed32cbc388563b490eb72c0ff986800302ec0ab6c19bdf8d63a37
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:686749d972d4e90f466b72f5a04d569779ab107826b090f5c435d2ae6efde530
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fde980dad26ff75414ed06027ec8ba5e7d484abbe46896b9304dc37a9238984f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 2.215216636657715,
3
- "best_model_checkpoint": "dq158/pingusPongus/checkpoint-14229",
4
- "epoch": 9.0,
5
  "eval_steps": 500,
6
- "global_step": 14229,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -346,13 +346,50 @@
346
  "eval_steps_per_second": 0.605,
347
  "eval_translation_length": 52546,
348
  "step": 14229
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
349
  }
350
  ],
351
  "logging_steps": 500,
352
  "max_steps": 31620,
353
  "num_train_epochs": 20,
354
  "save_steps": 500,
355
- "total_flos": 1.558637838068613e+17,
356
  "trial_name": null,
357
  "trial_params": null
358
  }
 
1
  {
2
+ "best_metric": 2.214895725250244,
3
+ "best_model_checkpoint": "dq158/pingusPongus/checkpoint-15810",
4
+ "epoch": 10.0,
5
  "eval_steps": 500,
6
+ "global_step": 15810,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
346
  "eval_steps_per_second": 0.605,
347
  "eval_translation_length": 52546,
348
  "step": 14229
349
+ },
350
+ {
351
+ "epoch": 9.17,
352
+ "learning_rate": 5.784166422325311e-05,
353
+ "loss": 2.0341,
354
+ "step": 14500
355
+ },
356
+ {
357
+ "epoch": 9.49,
358
+ "learning_rate": 5.534019366928e-05,
359
+ "loss": 2.0094,
360
+ "step": 15000
361
+ },
362
+ {
363
+ "epoch": 9.8,
364
+ "learning_rate": 5.282512040728659e-05,
365
+ "loss": 2.0032,
366
+ "step": 15500
367
+ },
368
+ {
369
+ "epoch": 10.0,
370
+ "eval_bleu": 1.0,
371
+ "eval_brevity_penalty": 1.0,
372
+ "eval_length_ratio": 1.0,
373
+ "eval_loss": 2.214895725250244,
374
+ "eval_precisions": [
375
+ 1.0,
376
+ 1.0,
377
+ 1.0,
378
+ 1.0
379
+ ],
380
+ "eval_reference_length": 52363,
381
+ "eval_runtime": 584.3355,
382
+ "eval_samples_per_second": 4.811,
383
+ "eval_steps_per_second": 0.602,
384
+ "eval_translation_length": 52363,
385
+ "step": 15810
386
  }
387
  ],
388
  "logging_steps": 500,
389
  "max_steps": 31620,
390
  "num_train_epochs": 20,
391
  "save_steps": 500,
392
+ "total_flos": 1.7318198200762368e+17,
393
  "trial_name": null,
394
  "trial_params": null
395
  }