dq158 committed on
Commit
c900c43
·
1 Parent(s): defe0c7

Training in progress, epoch 9, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d8e033f8dea1d357ffe6629c15f19815f5e32cd70953d97be45fc17aa0912ae
3
  size 2371770
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd19122e1b6607cdb79a7016978319f5233648dfa21d17f64f4c5ed9ebfab2b1
3
  size 2371770
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0d868b832fd968e13a3ef455165a190aba8506b04ef6b945c6e766f7ee84d1f
3
  size 990409330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20f9eff7f8c80652672f33d591daec33e74fa91afea6f63662fcce0b413fc45e
3
  size 990409330
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:525e460409507e49b218a1b42d06d85873c630a5ed78eb21f16030edb00fde0c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b21196dd7454f3b651b63e42d3595da46748179b2ded600b1b8e0ecb74a09883
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d507458213a337e4449ea78916d032601a9ab5585183fda8bd21d6d89f7d231
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:429bbb7d8273481822c70b354c32cf6b2c09f778063e5299935515e96827f77b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 1.8215827941894531,
3
  "best_model_checkpoint": "dq158/pingusPongus/checkpoint-3162",
4
- "epoch": 8.0,
5
  "eval_steps": 500,
6
- "global_step": 25296,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -459,13 +459,68 @@
459
  "eval_steps_per_second": 0.605,
460
  "eval_translation_length": 52579,
461
  "step": 25296
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
462
  }
463
  ],
464
  "logging_steps": 500,
465
  "max_steps": 63240,
466
  "num_train_epochs": 20,
467
  "save_steps": 500,
468
- "total_flos": 1.3854558560609894e+17,
469
  "trial_name": null,
470
  "trial_params": null
471
  }
 
1
  {
2
  "best_metric": 1.8215827941894531,
3
  "best_model_checkpoint": "dq158/pingusPongus/checkpoint-3162",
4
+ "epoch": 9.0,
5
  "eval_steps": 500,
6
+ "global_step": 28458,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
459
  "eval_steps_per_second": 0.605,
460
  "eval_translation_length": 52579,
461
  "step": 25296
462
+ },
463
+ {
464
+ "epoch": 8.06,
465
+ "learning_rate": 3.283962902837673e-05,
466
+ "loss": 1.8288,
467
+ "step": 25500
468
+ },
469
+ {
470
+ "epoch": 8.22,
471
+ "learning_rate": 3.22428902702372e-05,
472
+ "loss": 1.7989,
473
+ "step": 26000
474
+ },
475
+ {
476
+ "epoch": 8.38,
477
+ "learning_rate": 3.164161167838985e-05,
478
+ "loss": 1.795,
479
+ "step": 26500
480
+ },
481
+ {
482
+ "epoch": 8.54,
483
+ "learning_rate": 3.103617013343307e-05,
484
+ "loss": 1.7786,
485
+ "step": 27000
486
+ },
487
+ {
488
+ "epoch": 8.7,
489
+ "learning_rate": 3.0426945125298563e-05,
490
+ "loss": 1.7924,
491
+ "step": 27500
492
+ },
493
+ {
494
+ "epoch": 8.86,
495
+ "learning_rate": 2.9814318515387547e-05,
496
+ "loss": 1.8087,
497
+ "step": 28000
498
+ },
499
+ {
500
+ "epoch": 9.0,
501
+ "eval_bleu": 1.0,
502
+ "eval_brevity_penalty": 1.0,
503
+ "eval_length_ratio": 1.0,
504
+ "eval_loss": 1.8519303798675537,
505
+ "eval_precisions": [
506
+ 1.0,
507
+ 1.0,
508
+ 1.0,
509
+ 1.0
510
+ ],
511
+ "eval_reference_length": 52432,
512
+ "eval_runtime": 580.9392,
513
+ "eval_samples_per_second": 4.839,
514
+ "eval_steps_per_second": 0.606,
515
+ "eval_translation_length": 52432,
516
+ "step": 28458
517
  }
518
  ],
519
  "logging_steps": 500,
520
  "max_steps": 63240,
521
  "num_train_epochs": 20,
522
  "save_steps": 500,
523
+ "total_flos": 1.558637838068613e+17,
524
  "trial_name": null,
525
  "trial_params": null
526
  }