mrmuminov committed on
Commit
cb2905a
·
verified ·
1 Parent(s): 56110e2

End of training

Browse files
Files changed (3) hide show
  1. README.md +45 -23
  2. generation_config.json +6 -4
  3. model.safetensors +1 -1
README.md CHANGED
@@ -1,17 +1,17 @@
1
  ---
 
2
  language:
3
  - uz
4
  license: apache-2.0
5
  base_model: openai/whisper-small
6
  tags:
7
- - hf-asr-leaderboard
8
  - generated_from_trainer
9
  datasets:
10
  - mozilla-foundation/common_voice_16_1
11
  metrics:
12
  - wer
13
  model-index:
14
- - name: Whisper Small Uz - Bahriddin Mo'minov
15
  results:
16
  - task:
17
  name: Automatic Speech Recognition
@@ -25,18 +25,18 @@ model-index:
25
  metrics:
26
  - name: Wer
27
  type: wer
28
- value: 37.07903050585018
29
  ---
30
 
31
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
32
  should probably proofread and complete it, then remove this comment. -->
33
 
34
- # Whisper Small Uz - Bahriddin Mo'minov
35
 
36
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 16.1 dataset.
37
  It achieves the following results on the evaluation set:
38
- - Loss: 0.3759
39
- - Wer: 37.0790
40
 
41
  ## Model description
42
 
@@ -56,30 +56,52 @@ More information needed
56
 
57
  The following hyperparameters were used during training:
58
  - learning_rate: 1e-05
59
- - train_batch_size: 8
60
- - eval_batch_size: 4
61
  - seed: 42
62
- - gradient_accumulation_steps: 2
63
- - total_train_batch_size: 16
64
- - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
65
  - lr_scheduler_type: linear
66
- - lr_scheduler_warmup_steps: 500
67
- - training_steps: 4000
68
  - mixed_precision_training: Native AMP
69
 
70
  ### Training results
71
 
72
- | Training Loss | Epoch | Step | Validation Loss | Wer |
73
- |:-------------:|:-----:|:----:|:---------------:|:-------:|
74
- | 0.6057 | 0.26 | 1000 | 0.5283 | 46.5667 |
75
- | 0.436 | 0.53 | 2000 | 0.4354 | 42.1575 |
76
- | 0.4144 | 0.79 | 3000 | 0.3925 | 38.4788 |
77
- | 0.3194 | 1.06 | 4000 | 0.3759 | 37.0790 |
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
78
 
79
 
80
  ### Framework versions
81
 
82
- - Transformers 4.37.2
83
- - Pytorch 2.2.2+cu121
84
- - Datasets 2.18.0
85
- - Tokenizers 0.15.2
 
1
  ---
2
+ library_name: transformers
3
  language:
4
  - uz
5
  license: apache-2.0
6
  base_model: openai/whisper-small
7
  tags:
 
8
  - generated_from_trainer
9
  datasets:
10
  - mozilla-foundation/common_voice_16_1
11
  metrics:
12
  - wer
13
  model-index:
14
+ - name: Whisper Small UZ - Bahriddin Muminov
15
  results:
16
  - task:
17
  name: Automatic Speech Recognition
 
25
  metrics:
26
  - name: Wer
27
  type: wer
28
+ value: 24.46336925439856
29
  ---
30
 
31
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
32
  should probably proofread and complete it, then remove this comment. -->
33
 
34
+ # Whisper Small UZ - Bahriddin Muminov
35
 
36
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 16.1 dataset.
37
  It achieves the following results on the evaluation set:
38
+ - Loss: 0.2593
39
+ - Wer: 24.4634
40
 
41
  ## Model description
42
 
 
56
 
57
  The following hyperparameters were used during training:
58
  - learning_rate: 1e-05
59
+ - train_batch_size: 16
60
+ - eval_batch_size: 8
61
  - seed: 42
62
+ - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
 
 
63
  - lr_scheduler_type: linear
64
+ - lr_scheduler_warmup_steps: 1000
65
+ - training_steps: 57000
66
  - mixed_precision_training: Native AMP
67
 
68
  ### Training results
69
 
70
+ | Training Loss | Epoch | Step | Validation Loss | Wer |
71
+ |:-------------:|:------:|:-----:|:---------------:|:-------:|
72
+ | 0.357 | 0.0352 | 2000 | 0.4996 | 42.0801 |
73
+ | 0.2917 | 0.0704 | 4000 | 0.4227 | 36.4010 |
74
+ | 0.2222 | 0.1056 | 6000 | 0.3806 | 36.8330 |
75
+ | 0.2127 | 0.1408 | 8000 | 0.3559 | 31.9044 |
76
+ | 0.2131 | 0.1760 | 10000 | 0.3392 | 32.2440 |
77
+ | 0.2283 | 0.2112 | 12000 | 0.3387 | 30.3111 |
78
+ | 0.2056 | 0.2464 | 14000 | 0.3301 | 29.3033 |
79
+ | 0.1956 | 0.2816 | 16000 | 0.3195 | 30.3610 |
80
+ | 0.1819 | 0.3168 | 18000 | 0.3076 | 30.7056 |
81
+ | 0.1969 | 0.3520 | 20000 | 0.3033 | 29.4395 |
82
+ | 0.156 | 0.3872 | 22000 | 0.3137 | 28.3081 |
83
+ | 0.1521 | 0.4224 | 24000 | 0.2946 | 28.2145 |
84
+ | 0.1736 | 0.4576 | 26000 | 0.2952 | 27.6800 |
85
+ | 0.1647 | 0.4928 | 28000 | 0.2889 | 26.7835 |
86
+ | 0.1596 | 0.5280 | 30000 | 0.2923 | 26.6998 |
87
+ | 0.1586 | 0.5632 | 32000 | 0.2821 | 26.6561 |
88
+ | 0.1299 | 0.5984 | 34000 | 0.2775 | 26.9783 |
89
+ | 0.1564 | 0.6336 | 36000 | 0.2811 | 26.4600 |
90
+ | 0.1525 | 0.6688 | 38000 | 0.2699 | 26.7485 |
91
+ | 0.1469 | 0.7041 | 40000 | 0.2699 | 26.2765 |
92
+ | 0.1362 | 0.7393 | 42000 | 0.2666 | 25.4761 |
93
+ | 0.1268 | 0.7745 | 44000 | 0.2590 | 26.6236 |
94
+ | 0.1389 | 0.8097 | 46000 | 0.2617 | 25.5485 |
95
+ | 0.1277 | 0.8449 | 48000 | 0.2600 | 24.7443 |
96
+ | 0.1312 | 0.8801 | 50000 | 0.2633 | 24.9579 |
97
+ | 0.1431 | 0.9153 | 52000 | 0.2604 | 24.8180 |
98
+ | 0.1366 | 0.9505 | 54000 | 0.2601 | 24.4384 |
99
+ | 0.1363 | 0.9857 | 56000 | 0.2593 | 24.4634 |
100
 
101
 
102
  ### Framework versions
103
 
104
+ - Transformers 4.49.0
105
+ - Pytorch 2.6.0+cu124
106
+ - Datasets 3.4.1
107
+ - Tokenizers 0.21.1
generation_config.json CHANGED
@@ -51,11 +51,15 @@
51
  "forced_decoder_ids": [
52
  [
53
  1,
54
- null
55
  ],
56
  [
57
  2,
58
  50359
 
 
 
 
59
  ]
60
  ],
61
  "is_multilingual": true,
@@ -250,8 +254,6 @@
250
  49870,
251
  50254,
252
  50258,
253
- 50358,
254
- 50359,
255
  50360,
256
  50361,
257
  50362
@@ -260,5 +262,5 @@
260
  "transcribe": 50359,
261
  "translate": 50358
262
  },
263
- "transformers_version": "4.37.2"
264
  }
 
51
  "forced_decoder_ids": [
52
  [
53
  1,
54
+ 50337
55
  ],
56
  [
57
  2,
58
  50359
59
+ ],
60
+ [
61
+ 3,
62
+ 50363
63
  ]
64
  ],
65
  "is_multilingual": true,
 
254
  49870,
255
  50254,
256
  50258,
 
 
257
  50360,
258
  50361,
259
  50362
 
262
  "transcribe": 50359,
263
  "translate": 50358
264
  },
265
+ "transformers_version": "4.49.0"
266
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:de867767fc6eaf2e6234a6b7ec854b66e0bba8f2f1a6a5202b3cee0100d7058f
3
  size 966995080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:235d9c59d4ecb2540a7b82c3ac4019d466a46586833c91f51d8d4c07556a2ff9
3
  size 966995080