End of training

Files changed (6) hide show

README.md CHANGED Viewed

@@ -2,7 +2,7 @@
 language:
 - yo
 license: apache-2.0
-base_model: openai/whisper-small
 tags:
 - whisper-event
 - generated_from_trainer
@@ -25,7 +25,7 @@ model-index:
     metrics:
     - name: Wer
       type: wer
-      value: 51.071878940731395
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -33,10 +33,10 @@ should probably proofread and complete it, then remove this comment. -->
 # WhisperYoruba
-This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 17.0 dataset.
 It achieves the following results on the evaluation set:
-- Loss: 1.0256
-- Wer: 51.0719
 ## Model description
@@ -62,16 +62,14 @@ The following hyperparameters were used during training:
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 500
-- training_steps: 3500
 - mixed_precision_training: Native AMP
 ### Training results
-| Training Loss | Epoch   | Step | Validation Loss | Wer     |
-|:-------------:|:-------:|:----:|:---------------:|:-------:|
-| 0.2736        | 3.8462  | 1000 | 0.7361          | 51.3661 |
-| 0.0192        | 7.6923  | 2000 | 0.9077          | 51.7697 |
-| 0.0013        | 11.5385 | 3000 | 1.0256          | 51.0719 |
 ### Framework versions

 language:
 - yo
 license: apache-2.0
+base_model: openai/whisper-medium
 tags:
 - whisper-event
 - generated_from_trainer
     metrics:
     - name: Wer
       type: wer
+      value: 64.04371584699453
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 # WhisperYoruba
+This model is a fine-tuned version of [openai/whisper-medium](https://huggingface.co/openai/whisper-medium) on the Common Voice 17.0 dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.6691
+- Wer: 64.0437
 ## Model description
 - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: linear
 - lr_scheduler_warmup_steps: 500
+- training_steps: 1000
 - mixed_precision_training: Native AMP
 ### Training results
+| Training Loss | Epoch  | Step | Validation Loss | Wer     |
+|:-------------:|:------:|:----:|:---------------:|:-------:|
+| 0.1301        | 3.8462 | 1000 | 0.6691          | 64.0437 |
 ### Framework versions

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "openai/whisper-small",
   "activation_dropout": 0.0,
   "activation_function": "gelu",
   "apply_spec_augment": false,
@@ -13,17 +13,17 @@
   ],
   "bos_token_id": 50257,
   "classifier_proj_size": 256,
-  "d_model": 768,
-  "decoder_attention_heads": 12,
-  "decoder_ffn_dim": 3072,
   "decoder_layerdrop": 0.0,
-  "decoder_layers": 12,
   "decoder_start_token_id": 50258,
   "dropout": 0.0,
-  "encoder_attention_heads": 12,
-  "encoder_ffn_dim": 3072,
   "encoder_layerdrop": 0.0,
-  "encoder_layers": 12,
   "eos_token_id": 50257,
   "forced_decoder_ids": null,
   "init_std": 0.02,
@@ -39,7 +39,7 @@
   "max_target_positions": 448,
   "median_filter_width": 7,
   "model_type": "whisper",
-  "num_hidden_layers": 12,
   "num_mel_bins": 80,
   "pad_token_id": 50257,
   "scale_embedding": false,

 {
+  "_name_or_path": "openai/whisper-medium",
   "activation_dropout": 0.0,
   "activation_function": "gelu",
   "apply_spec_augment": false,
   ],
   "bos_token_id": 50257,
   "classifier_proj_size": 256,
+  "d_model": 1024,
+  "decoder_attention_heads": 16,
+  "decoder_ffn_dim": 4096,
   "decoder_layerdrop": 0.0,
+  "decoder_layers": 24,
   "decoder_start_token_id": 50258,
   "dropout": 0.0,
+  "encoder_attention_heads": 16,
+  "encoder_ffn_dim": 4096,
   "encoder_layerdrop": 0.0,
+  "encoder_layers": 24,
   "eos_token_id": 50257,
   "forced_decoder_ids": null,
   "init_std": 0.02,
   "max_target_positions": 448,
   "median_filter_width": 7,
   "model_type": "whisper",
+  "num_hidden_layers": 24,
   "num_mel_bins": 80,
   "pad_token_id": 50257,
   "scale_embedding": false,

generation_config.json CHANGED Viewed

@@ -1,44 +1,28 @@
 {
   "alignment_heads": [
     [
-      5,
-      3
     ],
     [
-      5,
-      9
-    ],
-    [
-      8,
-      0
-    ],
-    [
-      8,
       4
     ],
     [
-      8,
-      7
     ],
     [
-      8,
-      8
     ],
     [
-      9,
       0
     ],
     [
-      9,
-      7
-    ],
-    [
-      9,
-      9
-    ],
-    [
-      10,
-      5
     ]
   ],
   "begin_suppress_tokens": [

 {
   "alignment_heads": [
     [
+      13,
+      15
     ],
     [
+      15,
       4
     ],
     [
+      15,
+      15
     ],
     [
+      16,
+      1
     ],
     [
+      20,
       0
     ],
     [
+      23,
+      4
     ]
   ],
   "begin_suppress_tokens": [

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2aaeb6a9f5453ef8c9f10b121fbe891589b8db71fe7ad22a0280817e9efe11fb
-size 966995080

 version https://git-lfs.github.com/spec/v1
+oid sha256:46a7df1c1a237abf95ba1a0540d55a37894957964cac259c15fbae1e38ed241f
+size 3055544304

runs/Jan10_20-51-02_c3ff67a08b40/events.out.tfevents.1736542265.c3ff67a08b40.24.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:805baccd030d1cfc41ee4d2fabd3bb108c293bd8380a2d8cd2a8ddfe936e00fe
+size 14722

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:507d9af32281a031478aa4873225c61c2461c1d40d112876f755518e69632be0
 size 5240

 version https://git-lfs.github.com/spec/v1
+oid sha256:892cb92fd398740902173be6a42eb0425a68d750c9d5ba13deebb182ebe69d0d
 size 5240