kingabzpro
/

whisper-tiny-urdu

@@ -1,21 +1,82 @@
 ---
 base_model: openai/whisper-tiny
 tags:
-- text-generation-inference
-- transformers
-- unsloth
-- whisper
-license: apache-2.0
-language:
-- en
 ---
-# Uploaded finetuned  model
-- **Developed by:** kingabzpro
-- **License:** apache-2.0
-- **Finetuned from model :** openai/whisper-tiny
-This whisper model was trained 2x faster with [Unsloth](https://github.com/unslothai/unsloth) and Huggingface's TRL library.
-[<img src="https://raw.githubusercontent.com/unslothai/unsloth/main/images/unsloth%20made%20with%20love.png" width="200"/>](https://github.com/unslothai/unsloth)

 ---
+library_name: transformers
+license: apache-2.0
 base_model: openai/whisper-tiny
 tags:
+- generated_from_trainer
+datasets:
+- common_voice_17_0
+metrics:
+- wer
+model-index:
+- name: whisper-tiny-urdu
+  results:
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: common_voice_17_0
+      type: common_voice_17_0
+      config: ur
+      split: test[:600]
+      args: ur
+    metrics:
+    - name: Wer
+      type: wer
+      value: 47.85287528005975
 ---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# whisper-tiny-urdu
+This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the Urdu (`ur`) configuration of the common_voice_17_0 dataset.
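+It achieves the following results on the evaluation set (values are from the final checkpoint at step 2500; the lowest WER in the training results table, 46.7326, was reached at step 2000):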
+- Loss: 0.7225
+- Wer: 47.8529
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
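+Evaluation used the first 600 examples of the test split (`test[:600]`) of the `ur` configuration of common_voice_17_0. More information is needed about the training split.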
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 2e-05
+- train_batch_size: 32
+- eval_batch_size: 32
+- seed: 42
+- optimizer: AdamW (`OptimizerNames.ADAMW_TORCH`) with betas=(0.9,0.999) and epsilon=1e-08; no additional optimizer arguments
+- lr_scheduler_type: cosine
+- lr_scheduler_warmup_steps: 200
+- training_steps: 2500
+- mixed_precision_training: Native AMP
+### Training results
+| Training Loss | Epoch  | Step | Validation Loss | Wer     |
+|:-------------:|:------:|:----:|:---------------:|:-------:|
+| 0.6808        | 1.6949 | 500  | 0.7403          | 52.6699 |
+| 0.3948        | 3.3898 | 1000 | 0.6850          | 47.1247 |
+| 0.2873        | 5.0847 | 1500 | 0.6994          | 48.1516 |
+| 0.2024        | 6.7797 | 2000 | 0.7169          | 46.7326 |
+| 0.183         | 8.4746 | 2500 | 0.7225          | 47.8529 |
+### Framework versions
+- Transformers 4.51.3
+- Pytorch 2.6.0+cu124
+- Datasets 3.6.0
+- Tokenizers 0.21.1

generation_config.json CHANGED Viewed

@@ -25,7 +25,6 @@
       5
     ]
   ],
-  "attn_implementation": "sdpa",
   "begin_suppress_tokens": [
     220,
     50257
@@ -33,6 +32,16 @@
   "bos_token_id": 50257,
   "decoder_start_token_id": 50258,
   "eos_token_id": 50257,
   "is_multilingual": true,
   "lang_to_id": {
     "<|af|>": 50327,
@@ -135,18 +144,107 @@
     "<|yo|>": 50325,
     "<|zh|>": 50260
   },
-  "language": "<|ur|>",
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50363,
   "pad_token_id": 50257,
   "prev_sot_token_id": 50361,
   "return_timestamps": false,
-  "suppress_tokens": [],
   "task": "transcribe",
   "task_to_id": {
     "transcribe": 50359,
     "translate": 50358
   },
-  "transformers_version": "4.52.2"
 }

       5
     ]
   ],
   "begin_suppress_tokens": [
     220,
     50257
   "bos_token_id": 50257,
   "decoder_start_token_id": 50258,
   "eos_token_id": 50257,
+  "forced_decoder_ids": [
+    [
+      1,
+      null
+    ],
+    [
+      2,
+      50359
+    ]
+  ],
   "is_multilingual": true,
   "lang_to_id": {
     "<|af|>": 50327,
     "<|yo|>": 50325,
     "<|zh|>": 50260
   },
+  "language": "ur",
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50363,
   "pad_token_id": 50257,
   "prev_sot_token_id": 50361,
   "return_timestamps": false,
+  "suppress_tokens": [
+    1,
+    2,
+    7,
+    8,
+    9,
+    10,
+    14,
+    25,
+    26,
+    27,
+    28,
+    29,
+    31,
+    58,
+    59,
+    60,
+    61,
+    62,
+    63,
+    90,
+    91,
+    92,
+    93,
+    359,
+    503,
+    522,
+    542,
+    873,
+    893,
+    902,
+    918,
+    922,
+    931,
+    1350,
+    1853,
+    1982,
+    2460,
+    2627,
+    3246,
+    3253,
+    3268,
+    3536,
+    3846,
+    3961,
+    4183,
+    4667,
+    6585,
+    6647,
+    7273,
+    9061,
+    9383,
+    10428,
+    10929,
+    11938,
+    12033,
+    12331,
+    12562,
+    13793,
+    14157,
+    14635,
+    15265,
+    15618,
+    16553,
+    16604,
+    18362,
+    18956,
+    20075,
+    21675,
+    22520,
+    26130,
+    26161,
+    26435,
+    28279,
+    29464,
+    31650,
+    32302,
+    32470,
+    36865,
+    42863,
+    47425,
+    49870,
+    50254,
+    50258,
+    50358,
+    50359,
+    50360,
+    50361,
+    50362
+  ],
   "task": "transcribe",
   "task_to_id": {
     "transcribe": 50359,
     "translate": 50358
   },
+  "transformers_version": "4.51.3"
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fd5779dfd56c52f55eec26b2167d7701a1f035d2da42c388289994c8be1a444e
 size 151061672

 version https://git-lfs.github.com/spec/v1
+oid sha256:07e3f2812fdefe613b9def521a807b89f095c1fbc13de75f68e71700ec0f796b
 size 151061672