lkhagvaa12 committed on
Commit
61522d4
·
verified ·
1 Parent(s): 4ecb771

End of training

Browse files
Files changed (2) hide show
  1. README.md +6 -6
  2. generation_config.json +100 -2
README.md CHANGED
@@ -18,9 +18,9 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on an unspecified dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.5638
22
- - Wer Ortho: 63.8900
23
- - Wer: 63.8689
24
 
25
  ## Model description
26
 
@@ -46,19 +46,19 @@ The following hyperparameters were used during training:
46
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
47
  - lr_scheduler_type: constant_with_warmup
48
  - lr_scheduler_warmup_steps: 50
49
- - training_steps: 1000
50
  - mixed_precision_training: Native AMP
51
 
52
  ### Training results
53
 
54
  | Training Loss | Epoch | Step | Validation Loss | Wer Ortho | Wer |
55
  |:-------------:|:------:|:----:|:---------------:|:---------:|:-------:|
56
- | 0.3486 | 4.9505 | 1000 | 0.5638 | 63.8900 | 63.8689 |
57
 
58
 
59
  ### Framework versions
60
 
61
- - Transformers 4.51.3
62
  - Pytorch 2.6.0+cu124
63
  - Datasets 3.6.0
64
  - Tokenizers 0.21.2
 
18
 
19
  This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on an unspecified dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 2.1113
22
+ - Wer Ortho: 99.7982
23
+ - Wer: 99.7579
24
 
25
  ## Model description
26
 
 
46
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
47
  - lr_scheduler_type: constant_with_warmup
48
  - lr_scheduler_warmup_steps: 50
49
+ - training_steps: 500
50
  - mixed_precision_training: Native AMP
51
 
52
  ### Training results
53
 
54
  | Training Loss | Epoch | Step | Validation Loss | Wer Ortho | Wer |
55
  |:-------------:|:------:|:----:|:---------------:|:---------:|:-------:|
56
+ | 0.7937 | 1.9531 | 500 | 2.1113 | 99.7982 | 99.7579 |
57
 
58
 
59
  ### Framework versions
60
 
61
+ - Transformers 4.52.4
62
  - Pytorch 2.6.0+cu124
63
  - Datasets 3.6.0
64
  - Tokenizers 0.21.2
generation_config.json CHANGED
@@ -1,5 +1,4 @@
1
  {
2
- "_from_model_config": true,
3
  "alignment_heads": [
4
  [
5
  2,
@@ -33,6 +32,16 @@
33
  "bos_token_id": 50257,
34
  "decoder_start_token_id": 50258,
35
  "eos_token_id": 50257,
 
 
 
 
 
 
 
 
 
 
36
  "is_multilingual": true,
37
  "lang_to_id": {
38
  "<|af|>": 50327,
@@ -141,7 +150,96 @@
141
  "pad_token_id": 50257,
142
  "prev_sot_token_id": 50361,
143
  "return_timestamps": false,
144
- "suppress_tokens": [],
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
145
  "task_to_id": {
146
  "transcribe": 50359,
147
  "translate": 50358
 
1
  {
 
2
  "alignment_heads": [
3
  [
4
  2,
 
32
  "bos_token_id": 50257,
33
  "decoder_start_token_id": 50258,
34
  "eos_token_id": 50257,
35
+ "forced_decoder_ids": [
36
+ [
37
+ 1,
38
+ null
39
+ ],
40
+ [
41
+ 2,
42
+ 50359
43
+ ]
44
+ ],
45
  "is_multilingual": true,
46
  "lang_to_id": {
47
  "<|af|>": 50327,
 
150
  "pad_token_id": 50257,
151
  "prev_sot_token_id": 50361,
152
  "return_timestamps": false,
153
+ "suppress_tokens": [
154
+ 1,
155
+ 2,
156
+ 7,
157
+ 8,
158
+ 9,
159
+ 10,
160
+ 14,
161
+ 25,
162
+ 26,
163
+ 27,
164
+ 28,
165
+ 29,
166
+ 31,
167
+ 58,
168
+ 59,
169
+ 60,
170
+ 61,
171
+ 62,
172
+ 63,
173
+ 90,
174
+ 91,
175
+ 92,
176
+ 93,
177
+ 359,
178
+ 503,
179
+ 522,
180
+ 542,
181
+ 873,
182
+ 893,
183
+ 902,
184
+ 918,
185
+ 922,
186
+ 931,
187
+ 1350,
188
+ 1853,
189
+ 1982,
190
+ 2460,
191
+ 2627,
192
+ 3246,
193
+ 3253,
194
+ 3268,
195
+ 3536,
196
+ 3846,
197
+ 3961,
198
+ 4183,
199
+ 4667,
200
+ 6585,
201
+ 6647,
202
+ 7273,
203
+ 9061,
204
+ 9383,
205
+ 10428,
206
+ 10929,
207
+ 11938,
208
+ 12033,
209
+ 12331,
210
+ 12562,
211
+ 13793,
212
+ 14157,
213
+ 14635,
214
+ 15265,
215
+ 15618,
216
+ 16553,
217
+ 16604,
218
+ 18362,
219
+ 18956,
220
+ 20075,
221
+ 21675,
222
+ 22520,
223
+ 26130,
224
+ 26161,
225
+ 26435,
226
+ 28279,
227
+ 29464,
228
+ 31650,
229
+ 32302,
230
+ 32470,
231
+ 36865,
232
+ 42863,
233
+ 47425,
234
+ 49870,
235
+ 50254,
236
+ 50258,
237
+ 50358,
238
+ 50359,
239
+ 50360,
240
+ 50361,
241
+ 50362
242
+ ],
243
  "task_to_id": {
244
  "transcribe": 50359,
245
  "translate": 50358