EYEDOL committed on
Commit
5ce0d47
·
verified ·
1 Parent(s): 37dfbfa

End of training

Browse files
README.md CHANGED
@@ -12,7 +12,7 @@ datasets:
12
  metrics:
13
  - wer
14
  model-index:
15
- - name: Whisper-Small-SW-SWAHILI
16
  results:
17
  - task:
18
  name: Automatic Speech Recognition
@@ -26,18 +26,18 @@ model-index:
26
  metrics:
27
  - name: Wer
28
  type: wer
29
- value: 28.921534818493228
30
  ---
31
 
32
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
33
  should probably proofread and complete it, then remove this comment. -->
34
 
35
- # Whisper-Small-SW-SWAHILI
36
 
37
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 11.0 dataset.
38
  It achieves the following results on the evaluation set:
39
- - Loss: 0.4235
40
- - Wer: 28.9215
41
 
42
  ## Model description
43
 
@@ -63,15 +63,14 @@ The following hyperparameters were used during training:
63
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
64
  - lr_scheduler_type: linear
65
  - lr_scheduler_warmup_steps: 500
66
- - num_epochs: 2
67
  - mixed_precision_training: Native AMP
68
 
69
  ### Training results
70
 
71
  | Training Loss | Epoch | Step | Validation Loss | Wer |
72
  |:-------------:|:------:|:----:|:---------------:|:-------:|
73
- | 0.2925 | 0.8684 | 2000 | 0.4415 | 30.5814 |
74
- | 0.1532 | 1.7369 | 4000 | 0.4235 | 28.9215 |
75
 
76
 
77
  ### Framework versions
 
12
  metrics:
13
  - wer
14
  model-index:
15
+ - name: ASR_FROM_C3
16
  results:
17
  - task:
18
  name: Automatic Speech Recognition
 
26
  metrics:
27
  - name: Wer
28
  type: wer
29
+ value: 15.699933328735316
30
  ---
31
 
32
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
33
  should probably proofread and complete it, then remove this comment. -->
34
 
35
+ # ASR_FROM_C3
36
 
37
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 11.0 dataset.
38
  It achieves the following results on the evaluation set:
39
+ - Loss: 0.2158
40
+ - Wer: 15.6999
41
 
42
  ## Model description
43
 
 
63
  - optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
64
  - lr_scheduler_type: linear
65
  - lr_scheduler_warmup_steps: 500
66
+ - num_epochs: 1
67
  - mixed_precision_training: Native AMP
68
 
69
  ### Training results
70
 
71
  | Training Loss | Epoch | Step | Validation Loss | Wer |
72
  |:-------------:|:------:|:----:|:---------------:|:-------:|
73
+ | 0.1344 | 0.8684 | 2000 | 0.2158 | 15.6999 |
 
74
 
75
 
76
  ### Framework versions
config.json CHANGED
@@ -41,7 +41,7 @@
41
  "scale_embedding": false,
42
  "torch_dtype": "float32",
43
  "transformers_version": "4.52.4",
44
- "use_cache": true,
45
  "use_weighted_layer_sum": false,
46
  "vocab_size": 51865
47
  }
 
41
  "scale_embedding": false,
42
  "torch_dtype": "float32",
43
  "transformers_version": "4.52.4",
44
+ "use_cache": false,
45
  "use_weighted_layer_sum": false,
46
  "vocab_size": 51865
47
  }
generation_config.json CHANGED
@@ -1,167 +1,17 @@
1
  {
2
- "alignment_heads": [
3
- [
4
- 5,
5
- 3
6
- ],
7
- [
8
- 5,
9
- 9
10
- ],
11
- [
12
- 8,
13
- 0
14
- ],
15
- [
16
- 8,
17
- 4
18
- ],
19
- [
20
- 8,
21
- 7
22
- ],
23
- [
24
- 8,
25
- 8
26
- ],
27
- [
28
- 9,
29
- 0
30
- ],
31
- [
32
- 9,
33
- 7
34
- ],
35
- [
36
- 9,
37
- 9
38
- ],
39
- [
40
- 10,
41
- 5
42
- ]
43
- ],
44
- "begin_suppress_tokens": [
45
- 220,
46
- 50257
47
- ],
48
  "bos_token_id": 50257,
49
  "decoder_start_token_id": 50258,
50
  "eos_token_id": 50257,
51
- "is_multilingual": true,
52
  "lang_to_id": {
53
- "<|af|>": 50327,
54
- "<|am|>": 50334,
55
- "<|ar|>": 50272,
56
- "<|as|>": 50350,
57
- "<|az|>": 50304,
58
- "<|ba|>": 50355,
59
- "<|be|>": 50330,
60
- "<|bg|>": 50292,
61
- "<|bn|>": 50302,
62
- "<|bo|>": 50347,
63
- "<|br|>": 50309,
64
- "<|bs|>": 50315,
65
- "<|ca|>": 50270,
66
- "<|cs|>": 50283,
67
- "<|cy|>": 50297,
68
- "<|da|>": 50285,
69
- "<|de|>": 50261,
70
- "<|el|>": 50281,
71
- "<|en|>": 50259,
72
- "<|es|>": 50262,
73
- "<|et|>": 50307,
74
- "<|eu|>": 50310,
75
- "<|fa|>": 50300,
76
- "<|fi|>": 50277,
77
- "<|fo|>": 50338,
78
- "<|fr|>": 50265,
79
- "<|gl|>": 50319,
80
- "<|gu|>": 50333,
81
- "<|haw|>": 50352,
82
- "<|ha|>": 50354,
83
- "<|he|>": 50279,
84
- "<|hi|>": 50276,
85
- "<|hr|>": 50291,
86
- "<|ht|>": 50339,
87
- "<|hu|>": 50286,
88
- "<|hy|>": 50312,
89
- "<|id|>": 50275,
90
- "<|is|>": 50311,
91
- "<|it|>": 50274,
92
- "<|ja|>": 50266,
93
- "<|jw|>": 50356,
94
- "<|ka|>": 50329,
95
- "<|kk|>": 50316,
96
- "<|km|>": 50323,
97
- "<|kn|>": 50306,
98
- "<|ko|>": 50264,
99
- "<|la|>": 50294,
100
- "<|lb|>": 50345,
101
- "<|ln|>": 50353,
102
- "<|lo|>": 50336,
103
- "<|lt|>": 50293,
104
- "<|lv|>": 50301,
105
- "<|mg|>": 50349,
106
- "<|mi|>": 50295,
107
- "<|mk|>": 50308,
108
- "<|ml|>": 50296,
109
- "<|mn|>": 50314,
110
- "<|mr|>": 50320,
111
- "<|ms|>": 50282,
112
- "<|mt|>": 50343,
113
- "<|my|>": 50346,
114
- "<|ne|>": 50313,
115
- "<|nl|>": 50271,
116
- "<|nn|>": 50342,
117
- "<|no|>": 50288,
118
- "<|oc|>": 50328,
119
- "<|pa|>": 50321,
120
- "<|pl|>": 50269,
121
- "<|ps|>": 50340,
122
- "<|pt|>": 50267,
123
- "<|ro|>": 50284,
124
- "<|ru|>": 50263,
125
- "<|sa|>": 50344,
126
- "<|sd|>": 50332,
127
- "<|si|>": 50322,
128
- "<|sk|>": 50298,
129
- "<|sl|>": 50305,
130
- "<|sn|>": 50324,
131
- "<|so|>": 50326,
132
- "<|sq|>": 50317,
133
- "<|sr|>": 50303,
134
- "<|su|>": 50357,
135
- "<|sv|>": 50273,
136
- "<|sw|>": 50318,
137
- "<|ta|>": 50287,
138
- "<|te|>": 50299,
139
- "<|tg|>": 50331,
140
- "<|th|>": 50289,
141
- "<|tk|>": 50341,
142
- "<|tl|>": 50348,
143
- "<|tr|>": 50268,
144
- "<|tt|>": 50351,
145
- "<|uk|>": 50280,
146
- "<|ur|>": 50290,
147
- "<|uz|>": 50337,
148
- "<|vi|>": 50278,
149
- "<|yi|>": 50335,
150
- "<|yo|>": 50325,
151
- "<|zh|>": 50260
152
  },
153
  "language": "sw",
154
- "max_initial_timestamp_index": 50,
155
- "max_length": 448,
156
- "no_timestamps_token_id": 50363,
157
  "pad_token_id": 50257,
158
- "prev_sot_token_id": 50361,
159
- "return_timestamps": false,
160
- "suppress_tokens": [],
161
  "task": "transcribe",
162
  "task_to_id": {
163
  "transcribe": 50359,
164
  "translate": 50358
165
  },
166
- "transformers_version": "4.52.4"
 
167
  }
 
1
  {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  "bos_token_id": 50257,
3
  "decoder_start_token_id": 50258,
4
  "eos_token_id": 50257,
 
5
  "lang_to_id": {
6
+ "<|sw|>": 50318
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  },
8
  "language": "sw",
 
 
 
9
  "pad_token_id": 50257,
 
 
 
10
  "task": "transcribe",
11
  "task_to_id": {
12
  "transcribe": 50359,
13
  "translate": 50358
14
  },
15
+ "transformers_version": "4.52.4",
16
+ "use_cache": false
17
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cfa25fc5b77f8c3e57f604473cf4bd35f52d923c04509c0e887ff2d84b6d323d
3
  size 966995080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f0658bacea103517a8116ce163f7175eb5f69abe585f72ca966a49b1b2618fc
3
  size 966995080
runs/Aug11_05-57-33_fdc595d0574b/events.out.tfevents.1754891856.fdc595d0574b.19.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96a43d0d5de879d79a94582fb17b5b0116ead15be81dea5768b4a7b796f222e9
3
+ size 6549
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:477d35287b2e29852132f5582cd65cd10e4c08e416fe5b54a67630453eab8b35
3
  size 5432
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ddd7fd327eea9e40930d64ae1aca3b22eceb638ae13308746e0ded8608762d4
3
  size 5432