kingabzpro committed
Commit d198d47 · verified · 1 Parent(s): 83ec359

End of training

Files changed (3)
  1. README.md +74 -13
  2. generation_config.json +102 -4
  3. model.safetensors +1 -1
README.md CHANGED
@@ -1,21 +1,82 @@
  ---
+ library_name: transformers
+ license: apache-2.0
  base_model: openai/whisper-tiny
  tags:
- - text-generation-inference
- - transformers
- - unsloth
- - whisper
- license: apache-2.0
- language:
- - en
+ - generated_from_trainer
+ datasets:
+ - common_voice_17_0
+ metrics:
+ - wer
+ model-index:
+ - name: whisper-tiny-urdu
+   results:
+   - task:
+       name: Automatic Speech Recognition
+       type: automatic-speech-recognition
+     dataset:
+       name: common_voice_17_0
+       type: common_voice_17_0
+       config: ur
+       split: test[:600]
+       args: ur
+     metrics:
+     - name: Wer
+       type: wer
+       value: 47.85287528005975
  ---
 
- # Uploaded finetuned model
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
+ should probably proofread and complete it, then remove this comment. -->
 
- - **Developed by:** kingabzpro
- - **License:** apache-2.0
- - **Finetuned from model :** openai/whisper-tiny
+ # whisper-tiny-urdu
 
- This whisper model was trained 2x faster with [Unsloth](https://github.com/unslothai/unsloth) and Huggingface's TRL library.
+ This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the common_voice_17_0 dataset.
+ It achieves the following results on the evaluation set:
+ - Loss: 0.7225
+ - Wer: 47.8529
 
- [<img src="https://raw.githubusercontent.com/unslothai/unsloth/main/images/unsloth%20made%20with%20love.png" width="200"/>](https://github.com/unslothai/unsloth)
+ ## Model description
+
+ More information needed
+
+ ## Intended uses & limitations
+
+ More information needed
+
+ ## Training and evaluation data
+
+ More information needed
+
+ ## Training procedure
+
+ ### Training hyperparameters
+
+ The following hyperparameters were used during training:
+ - learning_rate: 2e-05
+ - train_batch_size: 32
+ - eval_batch_size: 32
+ - seed: 42
+ - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
+ - lr_scheduler_type: cosine
+ - lr_scheduler_warmup_steps: 200
+ - training_steps: 2500
+ - mixed_precision_training: Native AMP
+
+ ### Training results
+
+ | Training Loss | Epoch  | Step | Validation Loss | Wer     |
+ |:-------------:|:------:|:----:|:---------------:|:-------:|
+ | 0.6808        | 1.6949 | 500  | 0.7403          | 52.6699 |
+ | 0.3948        | 3.3898 | 1000 | 0.6850          | 47.1247 |
+ | 0.2873        | 5.0847 | 1500 | 0.6994          | 48.1516 |
+ | 0.2024        | 6.7797 | 2000 | 0.7169          | 46.7326 |
+ | 0.183         | 8.4746 | 2500 | 0.7225          | 47.8529 |
+
+ ### Framework versions
+
+ - Transformers 4.51.3
+ - Pytorch 2.6.0+cu124
+ - Datasets 3.6.0
+ - Tokenizers 0.21.1
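
For readers who want to reproduce the run, the sketch below shows roughly how the hyperparameters listed in the new card could map onto `Seq2SeqTrainingArguments` from transformers. It is not part of the commit; only the numeric values come from the card, while the output directory, the evaluation/save cadence, and the use of `fp16` for "Native AMP" are assumptions.

```python
# Hedged sketch: mapping the model-card hyperparameters onto Seq2SeqTrainingArguments.
# Only the numeric values are taken from the card; output_dir, eval/save cadence,
# and fp16 (standing in for "Native AMP") are assumptions.
from transformers import Seq2SeqTrainingArguments

training_args = Seq2SeqTrainingArguments(
    output_dir="whisper-tiny-urdu",      # assumption: any local output directory
    learning_rate=2e-5,
    per_device_train_batch_size=32,
    per_device_eval_batch_size=32,
    seed=42,
    optim="adamw_torch",                 # AdamW (torch) with default betas=(0.9, 0.999), eps=1e-8
    lr_scheduler_type="cosine",
    warmup_steps=200,
    max_steps=2500,
    fp16=True,                           # assumption: mixed precision via fp16
    eval_strategy="steps",               # assumption: evaluate every 500 steps, matching the results table
    eval_steps=500,
    save_steps=500,
)
```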
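A minimal inference sketch follows. It assumes the checkpoint is published under the repo id `kingabzpro/whisper-tiny-urdu` (inferred from the committer and model name, not stated in the diff) and that a local Urdu recording is available.

```python
# Minimal inference sketch (assumptions: repo id "kingabzpro/whisper-tiny-urdu",
# a local Urdu audio file "sample_ur.wav").
from transformers import pipeline

asr = pipeline(
    "automatic-speech-recognition",
    model="kingabzpro/whisper-tiny-urdu",
)

# Pinning language and task mirrors the generation_config.json changes below.
result = asr("sample_ur.wav", generate_kwargs={"language": "ur", "task": "transcribe"})
print(result["text"])
```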
generation_config.json CHANGED
@@ -25,7 +25,6 @@
      5
    ]
  ],
- "attn_implementation": "sdpa",
  "begin_suppress_tokens": [
    220,
    50257
@@ -33,6 +32,16 @@
  "bos_token_id": 50257,
  "decoder_start_token_id": 50258,
  "eos_token_id": 50257,
+ "forced_decoder_ids": [
+   [
+     1,
+     null
+   ],
+   [
+     2,
+     50359
+   ]
+ ],
  "is_multilingual": true,
  "lang_to_id": {
    "<|af|>": 50327,
@@ -135,18 +144,107 @@
    "<|yo|>": 50325,
    "<|zh|>": 50260
  },
- "language": "<|ur|>",
+ "language": "ur",
  "max_initial_timestamp_index": 50,
  "max_length": 448,
  "no_timestamps_token_id": 50363,
  "pad_token_id": 50257,
  "prev_sot_token_id": 50361,
  "return_timestamps": false,
- "suppress_tokens": [],
+ "suppress_tokens": [
+   1,
+   2,
+   7,
+   8,
+   9,
+   10,
+   14,
+   25,
+   26,
+   27,
+   28,
+   29,
+   31,
+   58,
+   59,
+   60,
+   61,
+   62,
+   63,
+   90,
+   91,
+   92,
+   93,
+   359,
+   503,
+   522,
+   542,
+   873,
+   893,
+   902,
+   918,
+   922,
+   931,
+   1350,
+   1853,
+   1982,
+   2460,
+   2627,
+   3246,
+   3253,
+   3268,
+   3536,
+   3846,
+   3961,
+   4183,
+   4667,
+   6585,
+   6647,
+   7273,
+   9061,
+   9383,
+   10428,
+   10929,
+   11938,
+   12033,
+   12331,
+   12562,
+   13793,
+   14157,
+   14635,
+   15265,
+   15618,
+   16553,
+   16604,
+   18362,
+   18956,
+   20075,
+   21675,
+   22520,
+   26130,
+   26161,
+   26435,
+   28279,
+   29464,
+   31650,
+   32302,
+   32470,
+   36865,
+   42863,
+   47425,
+   49870,
+   50254,
+   50258,
+   50358,
+   50359,
+   50360,
+   50361,
+   50362
+ ],
  "task": "transcribe",
  "task_to_id": {
    "transcribe": 50359,
    "translate": 50358
  },
- "transformers_version": "4.52.2"
+ "transformers_version": "4.51.3"
  }
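
Because `generate()` reads its defaults from `generation_config.json`, the committed changes mean Urdu transcription no longer needs the language forced at call time. A small sketch, assuming the same hypothetical repo id as above:

```python
# Sketch: confirming that the committed generation defaults are picked up.
# Assumption: the checkpoint lives at "kingabzpro/whisper-tiny-urdu".
from transformers import WhisperForConditionalGeneration

model = WhisperForConditionalGeneration.from_pretrained("kingabzpro/whisper-tiny-urdu")
gen_cfg = model.generation_config

print(gen_cfg.language)               # "ur"  (was "<|ur|>" before this commit)
print(gen_cfg.task)                   # "transcribe"
print(len(gen_cfg.suppress_tokens))   # 88 token ids suppressed during decoding
```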
model.safetensors CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:fd5779dfd56c52f55eec26b2167d7701a1f035d2da42c388289994c8be1a444e
+ oid sha256:07e3f2812fdefe613b9def521a807b89f095c1fbc13de75f68e71700ec0f796b
  size 151061672