zuazo committed on
Commit
27bbc22
·
verified ·
1 Parent(s): b5934c5

Model save

Browse files
Files changed (2) hide show
  1. README.md +19 -21
  2. generation_config.json +3 -2
README.md CHANGED
@@ -1,42 +1,39 @@
1
  ---
2
- language:
3
- - gl
4
  license: apache-2.0
5
  base_model: openai/whisper-tiny
6
  tags:
7
- - whisper-event
8
  - generated_from_trainer
9
  datasets:
10
- - mozilla-foundation/common_voice_13_0
11
  metrics:
12
  - wer
13
  model-index:
14
- - name: Whisper Tiny Galician
15
  results:
16
  - task:
17
  name: Automatic Speech Recognition
18
  type: automatic-speech-recognition
19
  dataset:
20
- name: mozilla-foundation/common_voice_13_0 gl
21
- type: mozilla-foundation/common_voice_13_0
22
  config: gl
23
  split: test
24
  args: gl
25
  metrics:
26
  - name: Wer
27
  type: wer
28
- value: 26.35037251655629
29
  ---
30
 
31
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
32
  should probably proofread and complete it, then remove this comment. -->
33
 
34
- # Whisper Tiny Galician
35
 
36
- This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the mozilla-foundation/common_voice_13_0 gl dataset.
37
  It achieves the following results on the evaluation set:
38
- - Loss: 0.5832
39
- - Wer: 26.3504
40
 
41
  ## Model description
42
 
@@ -63,21 +60,22 @@ The following hyperparameters were used during training:
63
  - lr_scheduler_type: linear
64
  - lr_scheduler_warmup_steps: 500
65
  - training_steps: 5000
 
66
 
67
  ### Training results
68
 
69
  | Training Loss | Epoch | Step | Validation Loss | Wer |
70
  |:-------------:|:-----:|:----:|:---------------:|:-------:|
71
- | 0.0062 | 19.01 | 1000 | 0.5832 | 26.3504 |
72
- | 0.0012 | 39.01 | 2000 | 0.6527 | 26.7177 |
73
- | 0.0006 | 59.01 | 3000 | 0.6950 | 27.4352 |
74
- | 0.0004 | 79.01 | 4000 | 0.7260 | 28.4044 |
75
- | 0.0003 | 99.01 | 5000 | 0.7315 | 28.1905 |
76
 
77
 
78
  ### Framework versions
79
 
80
- - Transformers 4.33.0.dev0
81
- - Pytorch 2.0.1+cu117
82
- - Datasets 2.14.4
83
- - Tokenizers 0.13.3
 
1
  ---
 
 
2
  license: apache-2.0
3
  base_model: openai/whisper-tiny
4
  tags:
 
5
  - generated_from_trainer
6
  datasets:
7
+ - common_voice_13_0
8
  metrics:
9
  - wer
10
  model-index:
11
+ - name: openai/whisper-tiny
12
  results:
13
  - task:
14
  name: Automatic Speech Recognition
15
  type: automatic-speech-recognition
16
  dataset:
17
+ name: common_voice_13_0
18
+ type: common_voice_13_0
19
  config: gl
20
  split: test
21
  args: gl
22
  metrics:
23
  - name: Wer
24
  type: wer
25
+ value: 26.13307119205298
26
  ---
27
 
28
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
29
  should probably proofread and complete it, then remove this comment. -->
30
 
31
+ # openai/whisper-tiny
32
 
33
+ This model is a fine-tuned version of [openai/whisper-tiny](https://huggingface.co/openai/whisper-tiny) on the common_voice_13_0 dataset.
34
  It achieves the following results on the evaluation set:
35
+ - Loss: 0.6003
36
+ - Wer: 26.1331
37
 
38
  ## Model description
39
 
 
60
  - lr_scheduler_type: linear
61
  - lr_scheduler_warmup_steps: 500
62
  - training_steps: 5000
63
+ - mixed_precision_training: Native AMP
64
 
65
  ### Training results
66
 
67
  | Training Loss | Epoch | Step | Validation Loss | Wer |
68
  |:-------------:|:-----:|:----:|:---------------:|:-------:|
69
+ | 0.3626 | 20.0 | 1000 | 0.5407 | 30.8464 |
70
+ | 0.1103 | 40.0 | 2000 | 0.5370 | 27.0402 |
71
+ | 0.0473 | 60.0 | 3000 | 0.5769 | 26.7263 |
72
+ | 0.03 | 80.0 | 4000 | 0.5936 | 26.1382 |
73
+ | 0.0244 | 100.0 | 5000 | 0.6003 | 26.1331 |
74
 
75
 
76
  ### Framework versions
77
 
78
+ - Transformers 4.37.2
79
+ - Pytorch 2.2.0+cu121
80
+ - Datasets 2.16.1
81
+ - Tokenizers 0.15.1
generation_config.json CHANGED
@@ -144,10 +144,11 @@
144
  "<|yo|>": 50325,
145
  "<|zh|>": 50260
146
  },
147
- "max_initial_timestamp_index": 1,
148
  "max_length": 448,
149
  "no_timestamps_token_id": 50363,
150
  "pad_token_id": 50257,
 
151
  "return_timestamps": false,
152
  "suppress_tokens": [
153
  1,
@@ -243,5 +244,5 @@
243
  "transcribe": 50359,
244
  "translate": 50358
245
  },
246
- "transformers_version": "4.33.0.dev0"
247
  }
 
144
  "<|yo|>": 50325,
145
  "<|zh|>": 50260
146
  },
147
+ "max_initial_timestamp_index": 50,
148
  "max_length": 448,
149
  "no_timestamps_token_id": 50363,
150
  "pad_token_id": 50257,
151
+ "prev_sot_token_id": 50361,
152
  "return_timestamps": false,
153
  "suppress_tokens": [
154
  1,
 
244
  "transcribe": 50359,
245
  "translate": 50358
246
  },
247
+ "transformers_version": "4.37.2"
248
  }