tuanna08go committed on
Commit
68602f1
·
verified ·
1 Parent(s): 024d448

Training in progress, step 40, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24d71c509df481ce2b666570621cd4aeb0e74dbea1d6f4910bcb6b8b380212e4
3
  size 9568884
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc66a7721c18943169d4b3ee985fdcce10036fcd4bd982456a4bb5bba0de91a9
3
  size 9568884
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9c101bb52e4f809de6487fd71b71482099d5184955d481f2aa26d4c99dfba27
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb9fd29eefd5c42407ec295468332b1e9c3ce692abc97431dfed1b61fac9d9ca
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:49fa7e5c4bd2e7be73796ceecdd7226a0477f69897edbc4e406600122a0902ee
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:694a539f11c8d87dcdc9a0523d10086c9a55d2b245bea58f425e64a8cd3022da
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.09022556390977443,
5
  "eval_steps": 10,
6
- "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -60,6 +60,21 @@
60
  "eval_samples_per_second": 24.809,
61
  "eval_steps_per_second": 12.405,
62
  "step": 30
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  }
64
  ],
65
  "logging_steps": 10,
@@ -79,7 +94,7 @@
79
  "attributes": {}
80
  }
81
  },
82
- "total_flos": 523099212349440.0,
83
  "train_batch_size": 2,
84
  "trial_name": null,
85
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.12030075187969924,
5
  "eval_steps": 10,
6
+ "global_step": 40,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
60
  "eval_samples_per_second": 24.809,
61
  "eval_steps_per_second": 12.405,
62
  "step": 30
63
+ },
64
+ {
65
+ "epoch": 0.12030075187969924,
66
+ "grad_norm": NaN,
67
+ "learning_rate": 7.3223304703363135e-06,
68
+ "loss": 0.0,
69
+ "step": 40
70
+ },
71
+ {
72
+ "epoch": 0.12030075187969924,
73
+ "eval_loss": NaN,
74
+ "eval_runtime": 5.5475,
75
+ "eval_samples_per_second": 25.236,
76
+ "eval_steps_per_second": 12.618,
77
+ "step": 40
78
  }
79
  ],
80
  "logging_steps": 10,
 
94
  "attributes": {}
95
  }
96
  },
97
+ "total_flos": 694497677672448.0,
98
  "train_batch_size": 2,
99
  "trial_name": null,
100
  "trial_params": null