8688chris committed on
Commit
d0ded5e
·
verified ·
1 Parent(s): f34e4d4

Model save

Browse files
Files changed (4) hide show
  1. README.md +37 -37
  2. config.json +7 -6
  3. model.safetensors +2 -2
  4. training_args.bin +1 -1
README.md CHANGED
@@ -1,6 +1,6 @@
1
  ---
2
  license: apache-2.0
3
- base_model: facebook/wav2vec2-large-960h
4
  tags:
5
  - generated_from_trainer
6
  metrics:
@@ -15,10 +15,10 @@ should probably proofread and complete it, then remove this comment. -->
15
 
16
  # Helldivers2ASR_V3
17
 
18
- This model is a fine-tuned version of [facebook/wav2vec2-large-960h](https://huggingface.co/facebook/wav2vec2-large-960h) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
- - Loss: 100.2962
21
- - Wer: 0.2096
22
 
23
  ## Model description
24
 
@@ -37,9 +37,9 @@ More information needed
37
  ### Training hyperparameters
38
 
39
  The following hyperparameters were used during training:
40
- - learning_rate: 0.0005
41
- - train_batch_size: 16
42
- - eval_batch_size: 16
43
  - seed: 42
44
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
45
  - lr_scheduler_type: constant
@@ -50,36 +50,36 @@ The following hyperparameters were used during training:
50
 
51
  | Training Loss | Epoch | Step | Validation Loss | Wer |
52
  |:-------------:|:-----:|:----:|:---------------:|:------:|
53
- | 1044.7378 | 1.0 | 328 | 674.2581 | 0.7134 |
54
- | 788.3286 | 2.0 | 656 | 551.7861 | 0.5443 |
55
- | 686.6791 | 3.0 | 984 | 475.5942 | 0.4852 |
56
- | 630.9951 | 4.0 | 1312 | 385.9394 | 0.4615 |
57
- | 591.5513 | 5.0 | 1640 | 375.8221 | 0.4019 |
58
- | 536.7542 | 6.0 | 1968 | 359.7422 | 0.4190 |
59
- | 503.6451 | 7.0 | 2296 | 351.6354 | 0.3961 |
60
- | 469.5973 | 8.0 | 2624 | 303.6820 | 0.3580 |
61
- | 437.5308 | 9.0 | 2952 | 242.7078 | 0.3969 |
62
- | 422.3093 | 10.0 | 3280 | 271.1854 | 0.3764 |
63
- | 409.4765 | 11.0 | 3608 | 281.5080 | 0.3541 |
64
- | 384.7355 | 12.0 | 3936 | 232.6271 | 0.3331 |
65
- | 368.876 | 13.0 | 4264 | 205.0227 | 0.3607 |
66
- | 359.576 | 14.0 | 4592 | 206.7654 | 0.3628 |
67
- | 347.9149 | 15.0 | 4920 | 203.3771 | 0.3131 |
68
- | 324.0592 | 16.0 | 5248 | 195.5896 | 0.3134 |
69
- | 313.765 | 17.0 | 5576 | 187.8961 | 0.2963 |
70
- | 308.2892 | 18.0 | 5904 | 175.5116 | 0.2926 |
71
- | 298.7906 | 19.0 | 6232 | 204.8492 | 0.2947 |
72
- | 276.8503 | 20.0 | 6560 | 174.5410 | 0.2763 |
73
- | 273.6627 | 21.0 | 6888 | 169.8062 | 0.2813 |
74
- | 262.0091 | 22.0 | 7216 | 151.0183 | 0.2493 |
75
- | 256.9988 | 23.0 | 7544 | 146.9712 | 0.2522 |
76
- | 253.0775 | 24.0 | 7872 | 138.4501 | 0.2474 |
77
- | 250.4051 | 25.0 | 8200 | 107.8654 | 0.2112 |
78
- | 247.1768 | 26.0 | 8528 | 113.1651 | 0.2062 |
79
- | 230.0392 | 27.0 | 8856 | 138.3462 | 0.2564 |
80
- | 232.4302 | 28.0 | 9184 | 128.4431 | 0.2469 |
81
- | 225.1965 | 29.0 | 9512 | 108.4411 | 0.2661 |
82
- | 220.6905 | 30.0 | 9840 | 100.2962 | 0.2096 |
83
 
84
 
85
  ### Framework versions
 
1
  ---
2
  license: apache-2.0
3
+ base_model: facebook/wav2vec2-base-960h
4
  tags:
5
  - generated_from_trainer
6
  metrics:
 
15
 
16
  # Helldivers2ASR_V3
17
 
18
+ This model is a fine-tuned version of [facebook/wav2vec2-base-960h](https://huggingface.co/facebook/wav2vec2-base-960h) on an unknown dataset.
19
  It achieves the following results on the evaluation set:
20
+ - Loss: 57.7348
21
+ - Wer: 0.0332
22
 
23
  ## Model description
24
 
 
37
  ### Training hyperparameters
38
 
39
  The following hyperparameters were used during training:
40
+ - learning_rate: 0.0002
41
+ - train_batch_size: 32
42
+ - eval_batch_size: 32
43
  - seed: 42
44
  - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
45
  - lr_scheduler_type: constant
 
50
 
51
  | Training Loss | Epoch | Step | Validation Loss | Wer |
52
  |:-------------:|:-----:|:----:|:---------------:|:------:|
53
+ | 1440.5784 | 1.0 | 165 | 827.7584 | 0.3982 |
54
+ | 901.7305 | 2.0 | 330 | 516.9960 | 0.2632 |
55
+ | 680.9522 | 3.0 | 495 | 461.0711 | 0.2190 |
56
+ | 572.9876 | 4.0 | 660 | 373.8802 | 0.1709 |
57
+ | 455.9722 | 5.0 | 825 | 325.0266 | 0.1536 |
58
+ | 405.2042 | 6.0 | 990 | 315.5705 | 0.1397 |
59
+ | 335.4539 | 7.0 | 1155 | 229.3944 | 0.1115 |
60
+ | 311.7148 | 8.0 | 1320 | 184.8958 | 0.0918 |
61
+ | 292.6152 | 9.0 | 1485 | 177.3645 | 0.0840 |
62
+ | 268.9287 | 10.0 | 1650 | 150.6056 | 0.0748 |
63
+ | 224.9027 | 11.0 | 1815 | 134.2426 | 0.0746 |
64
+ | 221.6842 | 12.0 | 1980 | 152.2036 | 0.0633 |
65
+ | 216.7037 | 13.0 | 2145 | 94.9223 | 0.0510 |
66
+ | 163.8511 | 14.0 | 2310 | 93.6272 | 0.0395 |
67
+ | 169.5703 | 15.0 | 2475 | 124.6715 | 0.0568 |
68
+ | 149.0854 | 16.0 | 2640 | 133.8979 | 0.0607 |
69
+ | 157.8008 | 17.0 | 2805 | 66.3784 | 0.0330 |
70
+ | 147.502 | 18.0 | 2970 | 71.3790 | 0.0335 |
71
+ | 148.8542 | 19.0 | 3135 | 72.7481 | 0.0419 |
72
+ | 136.0251 | 20.0 | 3300 | 129.4439 | 0.0523 |
73
+ | 129.7949 | 21.0 | 3465 | 49.1545 | 0.0262 |
74
+ | 126.8121 | 22.0 | 3630 | 67.8833 | 0.0343 |
75
+ | 126.8445 | 23.0 | 3795 | 66.8705 | 0.0327 |
76
+ | 127.7805 | 24.0 | 3960 | 70.8930 | 0.0309 |
77
+ | 113.9002 | 25.0 | 4125 | 44.5920 | 0.0233 |
78
+ | 102.9785 | 26.0 | 4290 | 65.2669 | 0.0280 |
79
+ | 107.9157 | 27.0 | 4455 | 39.7528 | 0.0212 |
80
+ | 103.8186 | 28.0 | 4620 | 46.9734 | 0.0246 |
81
+ | 103.4841 | 29.0 | 4785 | 58.0863 | 0.0264 |
82
+ | 81.7682 | 30.0 | 4950 | 57.7348 | 0.0332 |
83
 
84
 
85
  ### Framework versions
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "facebook/wav2vec2-large-960h",
3
  "activation_dropout": 0.1,
4
  "adapter_attn_dim": null,
5
  "adapter_kernel_size": 3,
@@ -53,12 +53,13 @@
53
  "feat_proj_dropout": 0.1,
54
  "feat_quantizer_dropout": 0.0,
55
  "final_dropout": 0.15,
 
56
  "hidden_act": "gelu",
57
  "hidden_dropout": 0.15,
58
  "hidden_dropout_prob": 0.1,
59
- "hidden_size": 1024,
60
  "initializer_range": 0.02,
61
- "intermediate_size": 4096,
62
  "layer_norm_eps": 1e-05,
63
  "layerdrop": 0.1,
64
  "mask_feature_length": 10,
@@ -69,15 +70,15 @@
69
  "mask_time_prob": 0.05,
70
  "model_type": "wav2vec2",
71
  "num_adapter_layers": 3,
72
- "num_attention_heads": 16,
73
  "num_codevector_groups": 2,
74
  "num_codevectors_per_group": 320,
75
  "num_conv_pos_embedding_groups": 16,
76
  "num_conv_pos_embeddings": 128,
77
  "num_feat_extract_layers": 7,
78
- "num_hidden_layers": 24,
79
  "num_negatives": 100,
80
- "output_hidden_size": 1024,
81
  "pad_token_id": 0,
82
  "proj_codevector_dim": 256,
83
  "tdnn_dilation": [
 
1
  {
2
+ "_name_or_path": "facebook/wav2vec2-base-960h",
3
  "activation_dropout": 0.1,
4
  "adapter_attn_dim": null,
5
  "adapter_kernel_size": 3,
 
53
  "feat_proj_dropout": 0.1,
54
  "feat_quantizer_dropout": 0.0,
55
  "final_dropout": 0.15,
56
+ "gradient_checkpointing": false,
57
  "hidden_act": "gelu",
58
  "hidden_dropout": 0.15,
59
  "hidden_dropout_prob": 0.1,
60
+ "hidden_size": 768,
61
  "initializer_range": 0.02,
62
+ "intermediate_size": 3072,
63
  "layer_norm_eps": 1e-05,
64
  "layerdrop": 0.1,
65
  "mask_feature_length": 10,
 
70
  "mask_time_prob": 0.05,
71
  "model_type": "wav2vec2",
72
  "num_adapter_layers": 3,
73
+ "num_attention_heads": 12,
74
  "num_codevector_groups": 2,
75
  "num_codevectors_per_group": 320,
76
  "num_conv_pos_embedding_groups": 16,
77
  "num_conv_pos_embeddings": 128,
78
  "num_feat_extract_layers": 7,
79
+ "num_hidden_layers": 12,
80
  "num_negatives": 100,
81
+ "output_hidden_size": 768,
82
  "pad_token_id": 0,
83
  "proj_codevector_dim": 256,
84
  "tdnn_dilation": [
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cf39c3bad3692b8ada5e3dbea6704a07b1768bafeeb113bc0fc2160f0feba24a
3
- size 1261897368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d81fe311e050fc59cbc06a44537263e8399d7b27e2915852a9aeb51171a1e58b
3
+ size 377611120
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c6e5da415c451c4bb69a5677f24ce26f9e584b30080767c1bfc04bf9fccee97
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:837b93a71322b18603c527653dcae8bb68872145d8929ffaa0f6430370f6b1c6
3
  size 5176