tmtms committed on
Commit
5931112
·
verified ·
1 Parent(s): 5d5eb09

End of training

Browse files
Files changed (4) hide show
  1. README.md +2 -28
  2. generation_config.json +2 -10
  3. model.safetensors +1 -1
  4. training_args.bin +1 -1
README.md CHANGED
@@ -8,22 +8,9 @@ tags:
8
  - generated_from_trainer
9
  datasets:
10
  - mozilla-foundation/common_voice_11_0
11
- metrics:
12
- - wer
13
  model-index:
14
  - name: Whisper Small Hi - Sanchit Gandhi
15
- results:
16
- - task:
17
- name: Automatic Speech Recognition
18
- type: automatic-speech-recognition
19
- dataset:
20
- name: Common Voice 11.0
21
- type: mozilla-foundation/common_voice_11_0
22
- args: 'config: hi, split: test'
23
- metrics:
24
- - name: Wer
25
- type: wer
26
- value: 6.685740099382623
27
  ---
28
 
29
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,9 +19,6 @@ should probably proofread and complete it, then remove this comment. -->
32
  # Whisper Small Hi - Sanchit Gandhi
33
 
34
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 11.0 dataset.
35
- It achieves the following results on the evaluation set:
36
- - Loss: 0.0912
37
- - Wer: 6.6857
38
 
39
  ## Model description
40
 
@@ -63,19 +47,9 @@ The following hyperparameters were used during training:
63
  - training_steps: 4000
64
  - mixed_precision_training: Native AMP
65
 
66
- ### Training results
67
-
68
- | Training Loss | Epoch | Step | Validation Loss | Wer |
69
- |:-------------:|:------:|:----:|:---------------:|:-------:|
70
- | 0.1441 | 0.7184 | 1000 | 0.1527 | 12.0012 |
71
- | 0.0457 | 1.4368 | 2000 | 0.1101 | 8.5680 |
72
- | 0.015 | 2.1552 | 3000 | 0.0938 | 6.9869 |
73
- | 0.0132 | 2.8736 | 4000 | 0.0912 | 6.6857 |
74
-
75
-
76
  ### Framework versions
77
 
78
  - Transformers 4.49.0
79
  - Pytorch 2.5.1+cu124
80
- - Datasets 3.3.0
81
  - Tokenizers 0.21.0
 
8
  - generated_from_trainer
9
  datasets:
10
  - mozilla-foundation/common_voice_11_0
 
 
11
  model-index:
12
  - name: Whisper Small Hi - Sanchit Gandhi
13
+ results: []
 
 
 
 
 
 
 
 
 
 
 
14
  ---
15
 
16
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
19
  # Whisper Small Hi - Sanchit Gandhi
20
 
21
  This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 11.0 dataset.
 
 
 
22
 
23
  ## Model description
24
 
 
47
  - training_steps: 4000
48
  - mixed_precision_training: Native AMP
49
 
 
 
 
 
 
 
 
 
 
 
50
  ### Framework versions
51
 
52
  - Transformers 4.49.0
53
  - Pytorch 2.5.1+cu124
54
+ - Datasets 3.3.1
55
  - Tokenizers 0.21.0
generation_config.json CHANGED
@@ -48,16 +48,6 @@
48
  "bos_token_id": 50257,
49
  "decoder_start_token_id": 50258,
50
  "eos_token_id": 50257,
51
- "forced_decoder_ids": [
52
- [
53
- 1,
54
- null
55
- ],
56
- [
57
- 2,
58
- 50359
59
- ]
60
- ],
61
  "is_multilingual": true,
62
  "lang_to_id": {
63
  "<|af|>": 50327,
@@ -160,6 +150,7 @@
160
  "<|yo|>": 50325,
161
  "<|zh|>": 50260
162
  },
 
163
  "max_initial_timestamp_index": 50,
164
  "max_length": 448,
165
  "no_timestamps_token_id": 50363,
@@ -254,6 +245,7 @@
254
  50361,
255
  50362
256
  ],
 
257
  "task_to_id": {
258
  "transcribe": 50359,
259
  "translate": 50358
 
48
  "bos_token_id": 50257,
49
  "decoder_start_token_id": 50258,
50
  "eos_token_id": 50257,
 
 
 
 
 
 
 
 
 
 
51
  "is_multilingual": true,
52
  "lang_to_id": {
53
  "<|af|>": 50327,
 
150
  "<|yo|>": 50325,
151
  "<|zh|>": 50260
152
  },
153
+ "language": "korea",
154
  "max_initial_timestamp_index": 50,
155
  "max_length": 448,
156
  "no_timestamps_token_id": 50363,
 
245
  50361,
246
  50362
247
  ],
248
+ "task": "transcribe",
249
  "task_to_id": {
250
  "transcribe": 50359,
251
  "translate": 50358
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aff419c5cb242b9c136afa6bb134ec1218980176be4d61efd76159f5960e4ea1
3
  size 966995080
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d7734884874f1a1513ed9aa760a4f8e97aaa02fd6d93a3a85d27b2ae9ca596b
3
  size 966995080
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef21989ce42cf0659dc8d3acbe3b7a913404c270075e65bfa91dc2ee2ac4846b
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c8b729bb3cde1fd600e37c2070196715389715e2ac60868c27299ce2b739b22
3
  size 5496