Model save

Browse files

Files changed (5) hide show

README.md +40 -41
config.json +8 -8
model.safetensors +2 -2
tokenizer_config.json +1 -2
training_args.bin +2 -2

README.md CHANGED Viewed

@@ -1,7 +1,6 @@
 ---
-library_name: transformers
 license: apache-2.0
-base_model: facebook/wav2vec2-base-960h
 tags:
 - generated_from_trainer
 metrics:
@@ -16,10 +15,10 @@ should probably proofread and complete it, then remove this comment. -->
 # Helldivers2ASR_V3
-This model is a fine-tuned version of [facebook/wav2vec2-base-960h](https://huggingface.co/facebook/wav2vec2-base-960h) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 46.4982
-- Wer: 0.0197
 ## Model description
@@ -38,11 +37,11 @@ More information needed
 ### Training hyperparameters
 The following hyperparameters were used during training:
-- learning_rate: 7e-05
-- train_batch_size: 32
-- eval_batch_size: 32
 - seed: 42
-- optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments
 - lr_scheduler_type: constant
 - num_epochs: 30
 - mixed_precision_training: Native AMP
@@ -51,41 +50,41 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss | Wer    |
 |:-------------:|:-----:|:----:|:---------------:|:------:|
-| 1568.7385     | 1.0   | 164  | 771.7803        | 0.3712 |
-| 1068.8207     | 2.0   | 328  | 590.2993        | 0.2698 |
-| 860.8321      | 3.0   | 492  | 448.1273        | 0.2125 |
-| 747.6548      | 4.0   | 656  | 366.1845        | 0.1805 |
-| 631.9949      | 5.0   | 820  | 274.8642        | 0.1421 |
-| 571.2026      | 6.0   | 984  | 241.3273        | 0.1242 |
-| 509.5936      | 7.0   | 1148 | 216.0463        | 0.1093 |
-| 435.6571      | 8.0   | 1312 | 176.9057        | 0.0875 |
-| 411.174       | 9.0   | 1476 | 165.9831        | 0.0833 |
-| 364.6828      | 10.0  | 1640 | 138.6788        | 0.0712 |
-| 345.6405      | 11.0  | 1804 | 136.7265        | 0.0675 |
-| 315.1662      | 12.0  | 1968 | 114.3673        | 0.0570 |
-| 284.2125      | 13.0  | 2132 | 98.1911         | 0.0520 |
-| 278.4242      | 14.0  | 2296 | 94.5904         | 0.0457 |
-| 238.8668      | 15.0  | 2460 | 86.1799         | 0.0465 |
-| 235.9656      | 16.0  | 2624 | 79.9327         | 0.0444 |
-| 224.2061      | 17.0  | 2788 | 66.6601         | 0.0331 |
-| 209.7441      | 18.0  | 2952 | 61.5226         | 0.0307 |
-| 197.9857      | 19.0  | 3116 | 59.2185         | 0.0286 |
-| 189.3057      | 20.0  | 3280 | 55.8568         | 0.0278 |
-| 201.0874      | 21.0  | 3444 | 58.7346         | 0.0268 |
-| 152.8864      | 22.0  | 3608 | 60.1501         | 0.0226 |
-| 161.5389      | 23.0  | 3772 | 61.3434         | 0.0273 |
-| 151.5226      | 24.0  | 3936 | 46.0442         | 0.0208 |
-| 154.1182      | 25.0  | 4100 | 49.2783         | 0.0200 |
-| 157.7021      | 26.0  | 4264 | 39.4705         | 0.0202 |
-| 143.6331      | 27.0  | 4428 | 44.7556         | 0.0234 |
-| 136.6361      | 28.0  | 4592 | 39.5889         | 0.0192 |
-| 133.5365      | 29.0  | 4756 | 42.7637         | 0.0173 |
-| 117.5687      | 30.0  | 4920 | 46.4982         | 0.0197 |
 ### Framework versions
-- Transformers 4.57.3
 - Pytorch 2.5.1+cu121
 - Datasets 3.6.0
-- Tokenizers 0.22.1

 ---
 license: apache-2.0
+base_model: facebook/wav2vec2-large-960h
 tags:
 - generated_from_trainer
 metrics:
 # Helldivers2ASR_V3
+This model is a fine-tuned version of [facebook/wav2vec2-large-960h](https://huggingface.co/facebook/wav2vec2-large-960h) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 100.2962
+- Wer: 0.2096
 ## Model description
 ### Training hyperparameters
 The following hyperparameters were used during training:
+- learning_rate: 0.0005
+- train_batch_size: 16
+- eval_batch_size: 16
 - seed: 42
+- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
 - lr_scheduler_type: constant
 - num_epochs: 30
 - mixed_precision_training: Native AMP
 | Training Loss | Epoch | Step | Validation Loss | Wer    |
 |:-------------:|:-----:|:----:|:---------------:|:------:|
+| 1044.7378     | 1.0   | 328  | 674.2581        | 0.7134 |
+| 788.3286      | 2.0   | 656  | 551.7861        | 0.5443 |
+| 686.6791      | 3.0   | 984  | 475.5942        | 0.4852 |
+| 630.9951      | 4.0   | 1312 | 385.9394        | 0.4615 |
+| 591.5513      | 5.0   | 1640 | 375.8221        | 0.4019 |
+| 536.7542      | 6.0   | 1968 | 359.7422        | 0.4190 |
+| 503.6451      | 7.0   | 2296 | 351.6354        | 0.3961 |
+| 469.5973      | 8.0   | 2624 | 303.6820        | 0.3580 |
+| 437.5308      | 9.0   | 2952 | 242.7078        | 0.3969 |
+| 422.3093      | 10.0  | 3280 | 271.1854        | 0.3764 |
+| 409.4765      | 11.0  | 3608 | 281.5080        | 0.3541 |
+| 384.7355      | 12.0  | 3936 | 232.6271        | 0.3331 |
+| 368.876       | 13.0  | 4264 | 205.0227        | 0.3607 |
+| 359.576       | 14.0  | 4592 | 206.7654        | 0.3628 |
+| 347.9149      | 15.0  | 4920 | 203.3771        | 0.3131 |
+| 324.0592      | 16.0  | 5248 | 195.5896        | 0.3134 |
+| 313.765       | 17.0  | 5576 | 187.8961        | 0.2963 |
+| 308.2892      | 18.0  | 5904 | 175.5116        | 0.2926 |
+| 298.7906      | 19.0  | 6232 | 204.8492        | 0.2947 |
+| 276.8503      | 20.0  | 6560 | 174.5410        | 0.2763 |
+| 273.6627      | 21.0  | 6888 | 169.8062        | 0.2813 |
+| 262.0091      | 22.0  | 7216 | 151.0183        | 0.2493 |
+| 256.9988      | 23.0  | 7544 | 146.9712        | 0.2522 |
+| 253.0775      | 24.0  | 7872 | 138.4501        | 0.2474 |
+| 250.4051      | 25.0  | 8200 | 107.8654        | 0.2112 |
+| 247.1768      | 26.0  | 8528 | 113.1651        | 0.2062 |
+| 230.0392      | 27.0  | 8856 | 138.3462        | 0.2564 |
+| 232.4302      | 28.0  | 9184 | 128.4431        | 0.2469 |
+| 225.1965      | 29.0  | 9512 | 108.4411        | 0.2661 |
+| 220.6905      | 30.0  | 9840 | 100.2962        | 0.2096 |
 ### Framework versions
+- Transformers 4.44.0
 - Pytorch 2.5.1+cu121
 - Datasets 3.6.0
+- Tokenizers 0.19.1

config.json CHANGED Viewed

@@ -1,4 +1,5 @@
 {
   "activation_dropout": 0.1,
   "adapter_attn_dim": null,
   "adapter_kernel_size": 3,
@@ -45,7 +46,6 @@
   "ctc_zero_infinity": false,
   "diversity_loss_weight": 0.1,
   "do_stable_layer_norm": false,
-  "dtype": "float32",
   "eos_token_id": 2,
   "feat_extract_activation": "gelu",
   "feat_extract_dropout": 0.0,
@@ -53,13 +53,12 @@
   "feat_proj_dropout": 0.1,
   "feat_quantizer_dropout": 0.0,
   "final_dropout": 0.15,
-  "gradient_checkpointing": false,
   "hidden_act": "gelu",
   "hidden_dropout": 0.15,
   "hidden_dropout_prob": 0.1,
-  "hidden_size": 768,
   "initializer_range": 0.02,
-  "intermediate_size": 3072,
   "layer_norm_eps": 1e-05,
   "layerdrop": 0.1,
   "mask_feature_length": 10,
@@ -70,15 +69,15 @@
   "mask_time_prob": 0.05,
   "model_type": "wav2vec2",
   "num_adapter_layers": 3,
-  "num_attention_heads": 12,
   "num_codevector_groups": 2,
   "num_codevectors_per_group": 320,
   "num_conv_pos_embedding_groups": 16,
   "num_conv_pos_embeddings": 128,
   "num_feat_extract_layers": 7,
-  "num_hidden_layers": 12,
   "num_negatives": 100,
-  "output_hidden_size": 768,
   "pad_token_id": 0,
   "proj_codevector_dim": 256,
   "tdnn_dilation": [
@@ -102,7 +101,8 @@
     1,
     1
   ],
-  "transformers_version": "4.57.3",
   "use_weighted_layer_sum": false,
   "vocab_size": 32,
   "xvector_output_dim": 512

 {
+  "_name_or_path": "facebook/wav2vec2-large-960h",
   "activation_dropout": 0.1,
   "adapter_attn_dim": null,
   "adapter_kernel_size": 3,
   "ctc_zero_infinity": false,
   "diversity_loss_weight": 0.1,
   "do_stable_layer_norm": false,
   "eos_token_id": 2,
   "feat_extract_activation": "gelu",
   "feat_extract_dropout": 0.0,
   "feat_proj_dropout": 0.1,
   "feat_quantizer_dropout": 0.0,
   "final_dropout": 0.15,
   "hidden_act": "gelu",
   "hidden_dropout": 0.15,
   "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
   "initializer_range": 0.02,
+  "intermediate_size": 4096,
   "layer_norm_eps": 1e-05,
   "layerdrop": 0.1,
   "mask_feature_length": 10,
   "mask_time_prob": 0.05,
   "model_type": "wav2vec2",
   "num_adapter_layers": 3,
+  "num_attention_heads": 16,
   "num_codevector_groups": 2,
   "num_codevectors_per_group": 320,
   "num_conv_pos_embedding_groups": 16,
   "num_conv_pos_embeddings": 128,
   "num_feat_extract_layers": 7,
+  "num_hidden_layers": 24,
   "num_negatives": 100,
+  "output_hidden_size": 1024,
   "pad_token_id": 0,
   "proj_codevector_dim": 256,
   "tdnn_dilation": [
     1,
     1
   ],
+  "torch_dtype": "float32",
+  "transformers_version": "4.44.0",
   "use_weighted_layer_sum": false,
   "vocab_size": 32,
   "xvector_output_dim": 512

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:50f75135f3205e071dffd7a5c9092a6319d6153256e8171dd3951b85377acaa1
-size 377611120

 version https://git-lfs.github.com/spec/v1
+oid sha256:cf39c3bad3692b8ada5e3dbea6704a07b1768bafeeb113bc0fc2160f0feba24a
+size 1261897368

tokenizer_config.json CHANGED Viewed

@@ -34,11 +34,10 @@
     }
   },
   "bos_token": "<s>",
-  "clean_up_tokenization_spaces": false,
   "do_lower_case": false,
   "do_normalize": true,
   "eos_token": "</s>",
-  "extra_special_tokens": {},
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<pad>",
   "processor_class": "Wav2Vec2Processor",

     }
   },
   "bos_token": "<s>",
+  "clean_up_tokenization_spaces": true,
   "do_lower_case": false,
   "do_normalize": true,
   "eos_token": "</s>",
   "model_max_length": 1000000000000000019884624838656,
   "pad_token": "<pad>",
   "processor_class": "Wav2Vec2Processor",

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bb8d8ecf665cf5a646bf6c6c5ea1422b8f2ac7fd9a95644e4e45fa189a41e155
-size 5432

 version https://git-lfs.github.com/spec/v1
+oid sha256:4c6e5da415c451c4bb69a5677f24ce26f9e584b30080767c1bfc04bf9fccee97
+size 5176