GogetaBlueMUI
/

whisper-small-ur

@@ -7,7 +7,7 @@ base_model: openai/whisper-small
 tags:
 - generated_from_trainer
 datasets:
-- mozilla-foundation/common_voice_11_0
 metrics:
 - wer
 model-index:
@@ -17,15 +17,15 @@ model-index:
       name: Automatic Speech Recognition
       type: automatic-speech-recognition
     dataset:
-      name: Common Voice 11.0
-      type: mozilla-foundation/common_voice_11_0
       config: ur
       split: test
       args: 'config: ur, split: test'
     metrics:
     - name: Wer
       type: wer
-      value: 35.41545725453771
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -33,10 +33,10 @@ should probably proofread and complete it, then remove this comment. -->
 # Whisper Small Ur - Muhammad Abdullah
-This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 11.0 dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.6090
-- Wer: 35.4155
 ## Model description
@@ -55,28 +55,27 @@ More information needed
 ### Training hyperparameters
 The following hyperparameters were used during training:
-- learning_rate: 1e-05
 - train_batch_size: 16
 - eval_batch_size: 8
 - seed: 42
 - optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
 - lr_scheduler_type: linear
-- lr_scheduler_warmup_steps: 500
-- training_steps: 1200
 - mixed_precision_training: Native AMP
 ### Training results
-| Training Loss | Epoch  | Step | Validation Loss | Wer     |
-|:-------------:|:------:|:----:|:---------------:|:-------:|
-| 0.451         | 1.5444 | 400  | 0.6250          | 39.7229 |
-| 0.133         | 3.0888 | 800  | 0.5866          | 37.1028 |
-| 0.0726        | 4.6332 | 1200 | 0.6090          | 35.4155 |
 ### Framework versions
-- Transformers 4.47.0
 - Pytorch 2.5.1+cu121
-- Datasets 3.1.0
 - Tokenizers 0.21.0

 tags:
 - generated_from_trainer
 datasets:
+- mozilla-foundation/common_voice_17_0
 metrics:
 - wer
 model-index:
       name: Automatic Speech Recognition
       type: automatic-speech-recognition
     dataset:
+      name: Common Voice 17.0
+      type: mozilla-foundation/common_voice_17_0
       config: ur
       split: test
       args: 'config: ur, split: test'
     metrics:
     - name: Wer
       type: wer
+      value: 92.16802838986547
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 should probably proofread and complete it, then remove this comment. -->
 # Whisper Small Ur - Muhammad Abdullah
+This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 17.0 dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.6097
+- Wer: 92.1680
 ## Model description
 ### Training hyperparameters
 The following hyperparameters were used during training:
+- learning_rate: 5e-06
 - train_batch_size: 16
 - eval_batch_size: 8
 - seed: 42
 - optimizer: Use adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
 - lr_scheduler_type: linear
+- lr_scheduler_warmup_steps: 100
+- training_steps: 500
 - mixed_precision_training: Native AMP
 ### Training results
+| Training Loss | Epoch  | Step | Validation Loss | Wer      |
+|:-------------:|:------:|:----:|:---------------:|:--------:|
+| 0.6086        | 0.7440 | 250  | 0.6541          | 102.7675 |
+| 0.4791        | 1.4881 | 500  | 0.6097          | 92.1680  |
 ### Framework versions
+- Transformers 4.47.1
 - Pytorch 2.5.1+cu121
+- Datasets 3.2.0
 - Tokenizers 0.21.0

generation_config.json CHANGED Viewed

@@ -160,7 +160,6 @@
     "<|yo|>": 50325,
     "<|zh|>": 50260
   },
-  "language": "ur",
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50363,
@@ -255,10 +254,9 @@
     50361,
     50362
   ],
-  "task": "transcribe",
   "task_to_id": {
     "transcribe": 50359,
     "translate": 50358
   },
-  "transformers_version": "4.47.0"
 }

     "<|yo|>": 50325,
     "<|zh|>": 50260
   },
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50363,
     50361,
     50362
   ],
   "task_to_id": {
     "transcribe": 50359,
     "translate": 50358
   },
+  "transformers_version": "4.47.1"
 }