Baselhany committed on
Commit
83138ce
·
verified ·
1 Parent(s): 4a8fc7c

Training in progress, step 31200, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:acfd926d6cc58589af2d096740d97bcaea3b4dc253655f4dc43910ed29399fae
3
  size 151061672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3ee8fc37c8613bbb15872cad6ebad49ca223781551cccf5a1b9b0ad18467fb2
3
  size 151061672
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:37f3d55a7903da147a3527941d27ae69b469e58bf862576ccfcbac4a3d1f9707
3
  size 297616186
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5578d7a0245a2025bba82193aa01c8cf6a3ac806a390be8c513f15bda8c6fb22
3
  size 297616186
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbb2a44ab7b4e7367def970d0740c81d46b38b4a0ba3a5a59d2bb9805d079b6c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16441e71a883a73943f99a673ecfc9552a2d020fc5d218917df2611efe07b45a
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d1d681d3c9dbf5bf4a58cd614b5037f58b217c9c938438c418d64757c1541e9f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20a61eab882d9ff36fc3c0a98b9cf084dec17a3d477545149ce16194f0d294fe
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": 13.23946766594109,
3
  "best_model_checkpoint": "./Whisper_tiny_fine_tune_Quran/checkpoint-28400",
4
- "epoch": 10.844996039081067,
5
  "eval_steps": 400,
6
- "global_step": 30800,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -5089,6 +5089,72 @@
5089
  "eval_steps_per_second": 0.22,
5090
  "eval_wer": 13.324883586366518,
5091
  "step": 30800
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5092
  }
5093
  ],
5094
  "logging_steps": 50,
@@ -5108,7 +5174,7 @@
5108
  "attributes": {}
5109
  }
5110
  },
5111
- "total_flos": 4.8528746348544e+19,
5112
  "train_batch_size": 16,
5113
  "trial_name": null,
5114
  "trial_params": null
 
1
  {
2
  "best_metric": 13.23946766594109,
3
  "best_model_checkpoint": "./Whisper_tiny_fine_tune_Quran/checkpoint-28400",
4
+ "epoch": 10.985828712261245,
5
  "eval_steps": 400,
6
+ "global_step": 31200,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
5089
  "eval_steps_per_second": 0.22,
5090
  "eval_wer": 13.324883586366518,
5091
  "step": 30800
5092
+ },
5093
+ {
5094
+ "epoch": 10.862600123228589,
5095
+ "grad_norm": 12202.451171875,
5096
+ "learning_rate": 3.9710352918137514e-08,
5097
+ "loss": 0.0009,
5098
+ "step": 30850
5099
+ },
5100
+ {
5101
+ "epoch": 10.880204207376112,
5102
+ "grad_norm": 41063.734375,
5103
+ "learning_rate": 3.018187139520734e-08,
5104
+ "loss": 0.0012,
5105
+ "step": 30900
5106
+ },
5107
+ {
5108
+ "epoch": 10.897808291523633,
5109
+ "grad_norm": 24295.453125,
5110
+ "learning_rate": 2.1958174560282595e-08,
5111
+ "loss": 0.0012,
5112
+ "step": 30950
5113
+ },
5114
+ {
5115
+ "epoch": 10.915412375671156,
5116
+ "grad_norm": 6690.68505859375,
5117
+ "learning_rate": 1.5039477146061577e-08,
5118
+ "loss": 0.001,
5119
+ "step": 31000
5120
+ },
5121
+ {
5122
+ "epoch": 10.933016459818678,
5123
+ "grad_norm": 11496.0478515625,
5124
+ "learning_rate": 9.4259598098001e-09,
5125
+ "loss": 0.001,
5126
+ "step": 31050
5127
+ },
5128
+ {
5129
+ "epoch": 10.9506205439662,
5130
+ "grad_norm": 6633.92529296875,
5131
+ "learning_rate": 5.117769128615279e-09,
5132
+ "loss": 0.0008,
5133
+ "step": 31100
5134
+ },
5135
+ {
5136
+ "epoch": 10.968224628113722,
5137
+ "grad_norm": 30724.099609375,
5138
+ "learning_rate": 2.11501759563304e-09,
5139
+ "loss": 0.0011,
5140
+ "step": 31150
5141
+ },
5142
+ {
5143
+ "epoch": 10.985828712261245,
5144
+ "grad_norm": 20161.490234375,
5145
+ "learning_rate": 4.1778361706268363e-10,
5146
+ "loss": 0.0011,
5147
+ "step": 31200
5148
+ },
5149
+ {
5150
+ "epoch": 10.985828712261245,
5151
+ "eval_cer": 4.058986198741961,
5152
+ "eval_loss": 0.014408305287361145,
5153
+ "eval_runtime": 1104.4483,
5154
+ "eval_samples_per_second": 3.501,
5155
+ "eval_steps_per_second": 0.219,
5156
+ "eval_wer": 13.302840768192215,
5157
+ "step": 31200
5158
  }
5159
  ],
5160
  "logging_steps": 50,
 
5174
  "attributes": {}
5175
  }
5176
  },
5177
+ "total_flos": 4.9158989807616e+19,
5178
  "train_batch_size": 16,
5179
  "trial_name": null,
5180
  "trial_params": null