Training in progress, step 31200, checkpoint
Browse files
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 151061672
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3ee8fc37c8613bbb15872cad6ebad49ca223781551cccf5a1b9b0ad18467fb2
|
3 |
size 151061672
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 297616186
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5578d7a0245a2025bba82193aa01c8cf6a3ac806a390be8c513f15bda8c6fb22
|
3 |
size 297616186
|
last-checkpoint/rng_state.pth
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14244
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16441e71a883a73943f99a673ecfc9552a2d020fc5d218917df2611efe07b45a
|
3 |
size 14244
|
last-checkpoint/scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1064
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20a61eab882d9ff36fc3c0a98b9cf084dec17a3d477545149ce16194f0d294fe
|
3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"best_metric": 13.23946766594109,
|
3 |
"best_model_checkpoint": "./Whisper_tiny_fine_tune_Quran/checkpoint-28400",
|
4 |
-
"epoch": 10.
|
5 |
"eval_steps": 400,
|
6 |
-
"global_step":
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
@@ -5089,6 +5089,72 @@
|
|
5089 |
"eval_steps_per_second": 0.22,
|
5090 |
"eval_wer": 13.324883586366518,
|
5091 |
"step": 30800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5092 |
}
|
5093 |
],
|
5094 |
"logging_steps": 50,
|
@@ -5108,7 +5174,7 @@
|
|
5108 |
"attributes": {}
|
5109 |
}
|
5110 |
},
|
5111 |
-
"total_flos": 4.
|
5112 |
"train_batch_size": 16,
|
5113 |
"trial_name": null,
|
5114 |
"trial_params": null
|
|
|
1 |
{
|
2 |
"best_metric": 13.23946766594109,
|
3 |
"best_model_checkpoint": "./Whisper_tiny_fine_tune_Quran/checkpoint-28400",
|
4 |
+
"epoch": 10.985828712261245,
|
5 |
"eval_steps": 400,
|
6 |
+
"global_step": 31200,
|
7 |
"is_hyper_param_search": false,
|
8 |
"is_local_process_zero": true,
|
9 |
"is_world_process_zero": true,
|
|
|
5089 |
"eval_steps_per_second": 0.22,
|
5090 |
"eval_wer": 13.324883586366518,
|
5091 |
"step": 30800
|
5092 |
+
},
|
5093 |
+
{
|
5094 |
+
"epoch": 10.862600123228589,
|
5095 |
+
"grad_norm": 12202.451171875,
|
5096 |
+
"learning_rate": 3.9710352918137514e-08,
|
5097 |
+
"loss": 0.0009,
|
5098 |
+
"step": 30850
|
5099 |
+
},
|
5100 |
+
{
|
5101 |
+
"epoch": 10.880204207376112,
|
5102 |
+
"grad_norm": 41063.734375,
|
5103 |
+
"learning_rate": 3.018187139520734e-08,
|
5104 |
+
"loss": 0.0012,
|
5105 |
+
"step": 30900
|
5106 |
+
},
|
5107 |
+
{
|
5108 |
+
"epoch": 10.897808291523633,
|
5109 |
+
"grad_norm": 24295.453125,
|
5110 |
+
"learning_rate": 2.1958174560282595e-08,
|
5111 |
+
"loss": 0.0012,
|
5112 |
+
"step": 30950
|
5113 |
+
},
|
5114 |
+
{
|
5115 |
+
"epoch": 10.915412375671156,
|
5116 |
+
"grad_norm": 6690.68505859375,
|
5117 |
+
"learning_rate": 1.5039477146061577e-08,
|
5118 |
+
"loss": 0.001,
|
5119 |
+
"step": 31000
|
5120 |
+
},
|
5121 |
+
{
|
5122 |
+
"epoch": 10.933016459818678,
|
5123 |
+
"grad_norm": 11496.0478515625,
|
5124 |
+
"learning_rate": 9.4259598098001e-09,
|
5125 |
+
"loss": 0.001,
|
5126 |
+
"step": 31050
|
5127 |
+
},
|
5128 |
+
{
|
5129 |
+
"epoch": 10.9506205439662,
|
5130 |
+
"grad_norm": 6633.92529296875,
|
5131 |
+
"learning_rate": 5.117769128615279e-09,
|
5132 |
+
"loss": 0.0008,
|
5133 |
+
"step": 31100
|
5134 |
+
},
|
5135 |
+
{
|
5136 |
+
"epoch": 10.968224628113722,
|
5137 |
+
"grad_norm": 30724.099609375,
|
5138 |
+
"learning_rate": 2.11501759563304e-09,
|
5139 |
+
"loss": 0.0011,
|
5140 |
+
"step": 31150
|
5141 |
+
},
|
5142 |
+
{
|
5143 |
+
"epoch": 10.985828712261245,
|
5144 |
+
"grad_norm": 20161.490234375,
|
5145 |
+
"learning_rate": 4.1778361706268363e-10,
|
5146 |
+
"loss": 0.0011,
|
5147 |
+
"step": 31200
|
5148 |
+
},
|
5149 |
+
{
|
5150 |
+
"epoch": 10.985828712261245,
|
5151 |
+
"eval_cer": 4.058986198741961,
|
5152 |
+
"eval_loss": 0.014408305287361145,
|
5153 |
+
"eval_runtime": 1104.4483,
|
5154 |
+
"eval_samples_per_second": 3.501,
|
5155 |
+
"eval_steps_per_second": 0.219,
|
5156 |
+
"eval_wer": 13.302840768192215,
|
5157 |
+
"step": 31200
|
5158 |
}
|
5159 |
],
|
5160 |
"logging_steps": 50,
|
|
|
5174 |
"attributes": {}
|
5175 |
}
|
5176 |
},
|
5177 |
+
"total_flos": 4.9158989807616e+19,
|
5178 |
"train_batch_size": 16,
|
5179 |
"trial_name": null,
|
5180 |
"trial_params": null
|