tmtms
/

whisper-small-hi

@@ -8,22 +8,9 @@ tags:
 - generated_from_trainer
 datasets:
 - mozilla-foundation/common_voice_11_0
-metrics:
-- wer
 model-index:
 - name: Whisper Small Hi - Sanchit Gandhi
-  results:
-  - task:
-      name: Automatic Speech Recognition
-      type: automatic-speech-recognition
-    dataset:
-      name: Common Voice 11.0
-      type: mozilla-foundation/common_voice_11_0
-      args: 'config: hi, split: test'
-    metrics:
-    - name: Wer
-      type: wer
-      value: 6.685740099382623
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -32,9 +19,6 @@ should probably proofread and complete it, then remove this comment. -->
 # Whisper Small Hi - Sanchit Gandhi
 This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 11.0 dataset.
-It achieves the following results on the evaluation set:
-- Loss: 0.0912
-- Wer: 6.6857
 ## Model description
@@ -63,19 +47,9 @@ The following hyperparameters were used during training:
 - training_steps: 4000
 - mixed_precision_training: Native AMP
-### Training results
-| Training Loss | Epoch  | Step | Validation Loss | Wer     |
-|:-------------:|:------:|:----:|:---------------:|:-------:|
-| 0.1441        | 0.7184 | 1000 | 0.1527          | 12.0012 |
-| 0.0457        | 1.4368 | 2000 | 0.1101          | 8.5680  |
-| 0.015         | 2.1552 | 3000 | 0.0938          | 6.9869  |
-| 0.0132        | 2.8736 | 4000 | 0.0912          | 6.6857  |
 ### Framework versions
 - Transformers 4.49.0
 - Pytorch 2.5.1+cu124
-- Datasets 3.3.0
 - Tokenizers 0.21.0

 - generated_from_trainer
 datasets:
 - mozilla-foundation/common_voice_11_0
 model-index:
 - name: Whisper Small Hi - Sanchit Gandhi
+  results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 # Whisper Small Hi - Sanchit Gandhi
 This model is a fine-tuned version of [openai/whisper-small](https://huggingface.co/openai/whisper-small) on the Common Voice 11.0 dataset.
 ## Model description
 - training_steps: 4000
 - mixed_precision_training: Native AMP
 ### Framework versions
 - Transformers 4.49.0
 - Pytorch 2.5.1+cu124
+- Datasets 3.3.1
 - Tokenizers 0.21.0

generation_config.json CHANGED Viewed

@@ -48,16 +48,6 @@
   "bos_token_id": 50257,
   "decoder_start_token_id": 50258,
   "eos_token_id": 50257,
-  "forced_decoder_ids": [
-    [
-      1,
-      null
-    ],
-    [
-      2,
-      50359
-    ]
-  ],
   "is_multilingual": true,
   "lang_to_id": {
     "<|af|>": 50327,
@@ -160,6 +150,7 @@
     "<|yo|>": 50325,
     "<|zh|>": 50260
   },
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50363,
@@ -254,6 +245,7 @@
     50361,
     50362
   ],
   "task_to_id": {
     "transcribe": 50359,
     "translate": 50358

   "bos_token_id": 50257,
   "decoder_start_token_id": 50258,
   "eos_token_id": 50257,
   "is_multilingual": true,
   "lang_to_id": {
     "<|af|>": 50327,
     "<|yo|>": 50325,
     "<|zh|>": 50260
   },
+  "language": "korean",
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50363,
     50361,
     50362
   ],
+  "task": "transcribe",
   "task_to_id": {
     "transcribe": 50359,
     "translate": 50358

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aff419c5cb242b9c136afa6bb134ec1218980176be4d61efd76159f5960e4ea1
 size 966995080

 version https://git-lfs.github.com/spec/v1
+oid sha256:1d7734884874f1a1513ed9aa760a4f8e97aaa02fd6d93a3a85d27b2ae9ca596b
 size 966995080

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ef21989ce42cf0659dc8d3acbe3b7a913404c270075e65bfa91dc2ee2ac4846b
 size 5496

 version https://git-lfs.github.com/spec/v1
+oid sha256:0c8b729bb3cde1fd600e37c2070196715389715e2ac60868c27299ce2b739b22
 size 5496