cruiser commited on
Commit
33a3131
·
1 Parent(s): 81e03f6

Training in progress, epoch 23

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a1d14856e0cfb3f34f2130fddb5a5195a5056760e7d4e244f5ec5c205eeee3cb
3
  size 535707205
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f19c4553b42a58e1898154505a846984d098e14b79006fb5eed27495e5e9e0a2
3
  size 535707205
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff29f633a7c3a67e99ca9a38c7a19825b66fc233eda1dc51c4bcf49612959cbb
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8819018e912e7348b43972bdf60d10f3292458a47010f09ce53d46b7206f5d78
3
  size 267858605
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd8eae39f0bee668624497a8eebdf03882e75328eeedd8b5ea83e195f440ba0b
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdf2dcc1482a674a7d29c0d8020585b4fcba2dc290a0343584994f1846bef070
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd2d6f56c81a5ee3c56fc6aef2526c2295f62bbce13cdeb6632e7e8c8630fd77
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf241e967f6b1435a68fde6d92854ccf48d554078e8a1bd6f2ca95ccf48c323a
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 1.606531023979187,
3
  "best_model_checkpoint": "distilbert_final_tweet_dataset_200_epoch/checkpoint-230",
4
- "epoch": 21.0,
5
- "global_step": 2415,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -240,11 +240,37 @@
240
  "eval_samples_per_second": 437.091,
241
  "eval_steps_per_second": 55.311,
242
  "step": 2415
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
243
  }
244
  ],
245
  "max_steps": 23000,
246
  "num_train_epochs": 200,
247
- "total_flos": 779367727884564.0,
248
  "trial_name": null,
249
  "trial_params": null
250
  }
 
1
  {
2
  "best_metric": 1.606531023979187,
3
  "best_model_checkpoint": "distilbert_final_tweet_dataset_200_epoch/checkpoint-230",
4
+ "epoch": 23.0,
5
+ "global_step": 2645,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
240
  "eval_samples_per_second": 437.091,
241
  "eval_steps_per_second": 55.311,
242
  "step": 2415
243
+ },
244
+ {
245
+ "epoch": 21.74,
246
+ "learning_rate": 4.456521739130435e-05,
247
+ "loss": 0.0264,
248
+ "step": 2500
249
+ },
250
+ {
251
+ "epoch": 22.0,
252
+ "eval_accuracy": 0.6512345679012346,
253
+ "eval_f1": 0.6561078483445887,
254
+ "eval_loss": 2.6863272190093994,
255
+ "eval_runtime": 0.749,
256
+ "eval_samples_per_second": 432.552,
257
+ "eval_steps_per_second": 54.736,
258
+ "step": 2530
259
+ },
260
+ {
261
+ "epoch": 23.0,
262
+ "eval_accuracy": 0.6604938271604939,
263
+ "eval_f1": 0.6610722610722611,
264
+ "eval_loss": 2.7173354625701904,
265
+ "eval_runtime": 0.7384,
266
+ "eval_samples_per_second": 438.801,
267
+ "eval_steps_per_second": 55.527,
268
+ "step": 2645
269
  }
270
  ],
271
  "max_steps": 23000,
272
  "num_train_epochs": 200,
273
+ "total_flos": 853593225778332.0,
274
  "trial_name": null,
275
  "trial_params": null
276
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff29f633a7c3a67e99ca9a38c7a19825b66fc233eda1dc51c4bcf49612959cbb
3
  size 267858605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8819018e912e7348b43972bdf60d10f3292458a47010f09ce53d46b7206f5d78
3
  size 267858605
runs/May01_10-03-26_b04f269e142e/events.out.tfevents.1682935412.b04f269e142e.1987.2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e19fc058ef448e4e8598743891f2b006f8515bb32fc840641ca1ba59a7a3d348
3
- size 12540
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f23b42ef39af3d797d5799a602b65543922a862cc20d2ab0a37d676bada58f1
3
+ size 13435